CaptainCook4D
diff --git a/‎core/config.py
Lines changed: 1 addition & 1 deletion b/‎core/config.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎dataloader/CaptainCookStepDataset.py
Lines changed: 124 additions & 114 deletions b/‎dataloader/CaptainCookStepDataset.py
Lines changed: 124 additions & 114 deletions
@@ -67,7 +67,7 @@ def setup_parser(self):
         parser.add_argument('--features_directory', type=str, default='/data/rohith/captain_cook/features/gopro'
                                                                       '/segments', help='features directory')
         parser.add_argument('--ckpt_directory', type=str, default='/data/rohith/captain_cook/checkpoints', help='checkpoint directory')
-        parser.add_argument('--split', type=str, default='recordings', help='split')
+        parser.add_argument('--split', type=str, default=const.RECORDINGS_SPLIT, help='split')
         parser.add_argument('--variant', type=str, default=const.MLP_VARIANT, help='variant')
         parser.add_argument('--model_name', type=str, default=None, help='model name')
         parser.add_argument('--task_name', type=str, default=const.ERROR_RECOGNITION, help='task name')
 
@@ -5,6 +5,7 @@
 import numpy as np
 import torch
 from torch.utils.data import Dataset
+from constants import Constants as const
 
 
 class CaptainCookStepDataset(Dataset):
@@ -18,124 +19,133 @@ def __init__(self, config, phase, split):
         with open('../annotations/annotation_json/step_annotations.json', 'r') as f:
             self._annotations = json.load(f)
 
+        print("Loaded annotations...... ")
+
         assert self._phase in ["train", "val", "test"], f"Invalid phase: {self._phase}"
-        self._features_directory = self._config.features_directory
 
-        if self._split == 'shuffle':
-            self._recording_ids_file = f"recordings_combined_splits.json"
-            print(f"Loading recording ids from {self._recording_ids_file}")
-
-            with open(f'../er_annotations/{self._recording_ids_file}', 'r') as file:
-                self._recording_ids_json = json.load(file)
-
-            self._recording_ids = self._recording_ids_json['train'] + self._recording_ids_json['val'] + self._recording_ids_json['test']
-
-            self._step_dict = {}
-            step_index_id = 0
-            for recording_id in self._recording_ids:
-                self._normal_step_dict = {}
-                self._error_step_dict = {}
-                normal_index_id = 0
-                error_index_id = 0
-                # 1. Prepare step_id, list(<start, end>) for the recording_id
-                recording_step_dictionary = {}
-                for step in self._annotations[recording_id]['steps']:
-                    if step['start_time'] < 0 or step['end_time'] < 0:
-                        # Ignore missing steps
-                        continue
-                    if recording_step_dictionary.get(step['step_id']) is None:
-                        recording_step_dictionary[step['step_id']] = []
-
-                    recording_step_dictionary[step['step_id']].append(
-                        (math.floor(step['start_time']), math.ceil(step['end_time']), step['has_errors']))
-
-                # 2. Add step start and end time list to the step_dict
-                for step_id in recording_step_dictionary.keys():
-                    # If the step has errors, add it to the error_step_dict, else add it to the normal_step_dict
-                    if recording_step_dictionary[step_id][0][2]:
-                        self._error_step_dict[f'E{error_index_id}'] = (recording_id, recording_step_dictionary[step_id])
-                        error_index_id += 1
-                    else:
-                        self._normal_step_dict[f'N{normal_index_id}'] = (
-                            recording_id, recording_step_dictionary[step_id])
-                        normal_index_id += 1
-
-                np.random.seed(config.seed)
-                np.random.shuffle(list(self._normal_step_dict.keys()))
-                np.random.shuffle(list(self._error_step_dict.keys()))
-
-                normal_step_indices = list(self._normal_step_dict.keys())
-                error_step_indices = list(self._error_step_dict.keys())
-
-                self._split_proportion = [0.75, 0.16, 0.9]
-
-                num_normal_steps = len(normal_step_indices)
-                num_error_steps = len(error_step_indices)
-
-                self._split_proportion_normal = [int(num_normal_steps * self._split_proportion[0]),
-                                                 int(num_normal_steps * (
-                                                         self._split_proportion[0] + self._split_proportion[1]))]
-                self._split_proportion_error = [int(num_error_steps * self._split_proportion[0]),
-                                                int(num_error_steps * (
-                                                        self._split_proportion[0] + self._split_proportion[1]))]
-
-                if phase == 'train':
-                    self._train_normal = normal_step_indices[:self._split_proportion_normal[0]]
-                    self._train_error = error_step_indices[:self._split_proportion_error[0]]
-                    train_indices = self._train_normal + self._train_error
-                    for index_id in train_indices:
-                        self._step_dict[step_index_id] = self._normal_step_dict.get(index_id,
-                                                                                    self._error_step_dict.get(index_id))
-                        step_index_id += 1
-                elif phase == 'test':
-                    self._val_normal = normal_step_indices[
-                                       self._split_proportion_normal[0]:self._split_proportion_normal[1]]
-                    self._val_error = error_step_indices[
-                                      self._split_proportion_error[0]:self._split_proportion_error[1]]
-                    val_indices = self._val_normal + self._val_error
-                    for index_id in val_indices:
-                        self._step_dict[step_index_id] = self._normal_step_dict.get(index_id,
-                                                                                    self._error_step_dict.get(index_id))
-                        step_index_id += 1
-                elif phase == 'val':
-                    self._test_normal = normal_step_indices[self._split_proportion_normal[1]:]
-                    self._test_error = error_step_indices[self._split_proportion_error[1]:]
-                    test_indices = self._test_normal + self._test_error
-                    for index_id in test_indices:
-                        self._step_dict[step_index_id] = self._normal_step_dict.get(index_id,
-                                                                                    self._error_step_dict.get(index_id))
-                        step_index_id += 1
+        self._features_directory = self._config.features_directory
 
+        if self._split == const.STEP_SPLIT:
+            self._init_step_split(config, phase)
         else:
-
-            self._recording_ids_file = f"{self._split}_combined_splits.json"
-
-            print(f"Loading recording ids from {self._recording_ids_file}")
-
-            with open(f'../er_annotations/{self._recording_ids_file}', 'r') as file:
-                self._recording_ids_json = json.load(file)
-
-            self._recording_ids = self._recording_ids_json[self._phase]
-
-            self._step_dict = {}
-            index_id = 0
-            for recording in self._recording_ids:
-                # 1. Prepare step_id, list(<start, end>) for the recording_id
-                recording_step_dictionary = {}
-                for step in self._annotations[recording]['steps']:
-                    if step['start_time'] < 0 or step['end_time'] < 0:
-                        # Ignore missing steps
-                        continue
-                    if recording_step_dictionary.get(step['step_id']) is None:
-                        recording_step_dictionary[step['step_id']] = []
-
-                    recording_step_dictionary[step['step_id']].append(
-                        (math.floor(step['start_time']), math.ceil(step['end_time']), step['has_errors']))
-
-                # 2. Add step start and end time list to the step_dict
-                for step_id in recording_step_dictionary.keys():
-                    self._step_dict[index_id] = (recording, recording_step_dictionary[step_id])
-                    index_id += 1
+            self._init_other_split_from_file(config, phase)
+
+    def _init_step_split(self, config, phase):
+        """Build ``self._step_dict`` for the step-level split.
+
+        Every recording listed under 'train', 'val' and 'test' in
+        ``recordings_combined_splits.json`` contributes to all phases. Per
+        recording, the annotated steps are grouped by ``step_id``, bucketed
+        into normal and erroneous groups, shuffled with ``config.seed`` and
+        sliced: 'train' keeps the first 75%, 'test' the next 16% and 'val'
+        the remainder. The selected entries are appended to
+        ``self._step_dict`` under a running integer index.
+
+        Args:
+            config: configuration object; only ``config.seed`` is read here.
+            phase: 'train', 'val' or 'test'; selects which slice is kept.
+        """
+        self._recording_ids_file = "recordings_combined_splits.json"
+        print(f"Loading recording ids from {self._recording_ids_file}")
+        # NOTE(review): machine-specific absolute path -- TODO derive it from the config
+        # or from the location of this module before running on another machine.
+        annotations_file_path = f"/home/rxp190007/CODE/error_recognition/er_annotations/{self._recording_ids_file}"
+        with open(f'{annotations_file_path}', 'r') as file:
+            self._recording_ids_json = json.load(file)
+
+        self._recording_ids = self._recording_ids_json['train'] + self._recording_ids_json['val'] + \
+                              self._recording_ids_json['test']
+
+        self._step_dict = {}
+        step_index_id = 0
+        for recording_id in self._recording_ids:
+            self._normal_step_dict = {}
+            self._error_step_dict = {}
+            normal_index_id = 0
+            error_index_id = 0
+            # 1. Prepare step_id -> list(<start, end, has_errors>) for the recording_id
+            recording_step_dictionary = {}
+            for step in self._annotations[recording_id]['steps']:
+                if step['start_time'] < 0 or step['end_time'] < 0:
+                    # Ignore missing steps
+                    continue
+                if recording_step_dictionary.get(step['step_id']) is None:
+                    recording_step_dictionary[step['step_id']] = []
+
+                recording_step_dictionary[step['step_id']].append(
+                    (math.floor(step['start_time']), math.ceil(step['end_time']), step['has_errors']))
+
+            # 2. Bucket every step by the has_errors flag of its first segment
+            for step_id in recording_step_dictionary.keys():
+                if recording_step_dictionary[step_id][0][2]:
+                    self._error_step_dict[f'E{error_index_id}'] = (recording_id, recording_step_dictionary[step_id])
+                    error_index_id += 1
+                else:
+                    self._normal_step_dict[f'N{normal_index_id}'] = (
+                        recording_id, recording_step_dictionary[step_id])
+                    normal_index_id += 1
+
+            normal_step_indices = list(self._normal_step_dict.keys())
+            error_step_indices = list(self._error_step_dict.keys())
+
+            # Shuffle the very lists that are sliced below. np.random.shuffle works
+            # in place, so shuffling a temporary list(d.keys()) copy has no effect.
+            # Re-seeding per recording keeps the permutation identical across the
+            # separately constructed train/val/test datasets, so slices stay disjoint.
+            np.random.seed(config.seed)
+            np.random.shuffle(normal_step_indices)
+            np.random.shuffle(error_step_indices)
+
+            # Only the first two proportions are read below.
+            # NOTE(review): the third entry is presumably meant to be 0.09 -- confirm.
+            self._split_proportion = [0.75, 0.16, 0.9]
+
+            num_normal_steps = len(normal_step_indices)
+            num_error_steps = len(error_step_indices)
+
+            # Slice boundaries: [end of first slice, end of second slice]
+            self._split_proportion_normal = [int(num_normal_steps * self._split_proportion[0]),
+                                             int(num_normal_steps * (
+                                                     self._split_proportion[0] + self._split_proportion[1]))]
+            self._split_proportion_error = [int(num_error_steps * self._split_proportion[0]),
+                                            int(num_error_steps * (
+                                                    self._split_proportion[0] + self._split_proportion[1]))]
+
+            if phase == 'train':
+                self._train_normal = normal_step_indices[:self._split_proportion_normal[0]]
+                self._train_error = error_step_indices[:self._split_proportion_error[0]]
+                train_indices = self._train_normal + self._train_error
+                for index_id in train_indices:
+                    self._step_dict[step_index_id] = self._normal_step_dict.get(index_id,
+                                                                                self._error_step_dict.get(index_id))
+                    step_index_id += 1
+            elif phase == 'test':
+                # NOTE(review): the 'test' phase fills the ``_val_*`` attributes (and 'val'
+                # fills ``_test_*`` below) -- confirm whether the naming is intentional.
+                self._val_normal = normal_step_indices[
+                                   self._split_proportion_normal[0]:self._split_proportion_normal[1]]
+                self._val_error = error_step_indices[
+                                  self._split_proportion_error[0]:self._split_proportion_error[1]]
+                val_indices = self._val_normal + self._val_error
+                for index_id in val_indices:
+                    self._step_dict[step_index_id] = self._normal_step_dict.get(index_id,
+                                                                                self._error_step_dict.get(index_id))
+                    step_index_id += 1
+            elif phase == 'val':
+                self._test_normal = normal_step_indices[self._split_proportion_normal[1]:]
+                self._test_error = error_step_indices[self._split_proportion_error[1]:]
+                test_indices = self._test_normal + self._test_error
+                for index_id in test_indices:
+                    self._step_dict[step_index_id] = self._normal_step_dict.get(index_id,
+                                                                                self._error_step_dict.get(index_id))
+                    step_index_id += 1
+
+    def _init_other_split_from_file(self, config, phase):
+        """Populate ``self._step_dict`` from a recording-level split file.
+
+        Loads ``<split>_combined_splits.json``, takes the recording ids stored
+        under ``phase`` and adds one entry per (recording, step_id) pair, keyed
+        by a running integer index.
+
+        Args:
+            config: not read by this method.
+            phase: key of the split JSON whose recording ids are loaded.
+        """
+        self._recording_ids_file = f"{self._split}_combined_splits.json"
+        # NOTE(review): machine-specific absolute path -- confirm before running elsewhere.
+        annotations_file_path = f"/home/rxp190007/CODE/error_recognition/er_annotations/{self._recording_ids_file}"
+        print(f"Loading recording ids from {self._recording_ids_file}")
+        with open(annotations_file_path, 'r') as file:
+            self._recording_ids_json = json.load(file)
+
+        self._recording_ids = self._recording_ids_json[phase]
+        self._step_dict = {}
+        for recording in self._recording_ids:
+            # Group the (start, end, has_errors) segments of this recording by step_id.
+            segments_by_step = {}
+            for step in self._annotations[recording]['steps']:
+                if step['start_time'] < 0 or step['end_time'] < 0:
+                    # Ignore missing steps
+                    continue
+                segments_by_step.setdefault(step['step_id'], []).append(
+                    (math.floor(step['start_time']), math.ceil(step['end_time']), step['has_errors']))
+
+            # The next free key equals the number of entries stored so far.
+            for segments in segments_by_step.values():
+                self._step_dict[len(self._step_dict)] = (recording, segments)
 
     def __len__(self):
         assert len(self._step_dict) > 0, "No data found in the dataset"