OpenSportsLab
diff --git a/‎.DS_Store‎
6 KB b/‎.DS_Store‎
6 KB
diff --git a/‎annotation_tool/controllers/history_manager.py‎
Lines changed: 64 additions & 2 deletions b/‎annotation_tool/controllers/history_manager.py‎
Lines changed: 64 additions & 2 deletions
diff --git a/‎annotation_tool/controllers/localization/loc_file_manager.py‎
Lines changed: 46 additions & 40 deletions b/‎annotation_tool/controllers/localization/loc_file_manager.py‎
Lines changed: 46 additions & 40 deletions
diff --git a/‎annotation_tool/controllers/localization/loc_inference.py‎
Lines changed: 51 additions & 26 deletions b/‎annotation_tool/controllers/localization/loc_inference.py‎
Lines changed: 51 additions & 26 deletions
@@ -53,7 +53,7 @@ def _refresh_active_view(self):
             # Refresh Events (Table & Timeline)
             self.main.loc_manager._refresh_current_clip_events()
             # Refresh left side
-            self.main.loc_manager.populate_tree()
+            self.main.loc_manager.refresh_tree_icons()
 
         # 2. Description Mode
         elif current_widget == self.main.ui.description_ui:
@@ -201,6 +201,68 @@ def _apply_state_change(self, cmd, is_undo):
 
             self._refresh_active_view()
 
+
+        # =========================================================
+        # Redo/undo for localization smart annotation
+        # =========================================================
+        elif ctype == CmdType.LOC_SMART_CONFIRM:
+            path = cmd['video_path']
+            events = cmd['confirmed_events']
+            
+            smart_events = self.model.smart_localization_events.get(path, [])
+            temp_events = self.model.temp_smart_events.get(path, [])
+            
+            if is_undo:
+                for evt in events:
+                    if evt in smart_events:
+                        smart_events.remove(evt)
+                temp_events.extend(events)
+                temp_events.sort(key=lambda x: x.get('position_ms', 0))
+            else:
+                for evt in events:
+                    if evt in temp_events:
+                        temp_events.remove(evt)
+                smart_events.extend(events)
+                smart_events.sort(key=lambda x: x.get('position_ms', 0))
+                
+            self.model.smart_localization_events[path] = smart_events
+            self.model.temp_smart_events[path] = temp_events
+            
+            self.main.loc_manager.refresh_tree_icons()
+            self.main.loc_manager._display_smart_events(path)
+
+        elif ctype == CmdType.LOC_SMART_EVENT_DEL:
+            path = cmd['video_path']
+            evt = cmd['event']
+            is_confirmed = cmd['is_confirmed']
+            
+            if is_confirmed:
+                events_list = self.model.smart_localization_events.setdefault(path, [])
+            else:
+                events_list = self.model.temp_smart_events.setdefault(path, [])
+                
+            if is_undo:
+                events_list.append(evt)
+                events_list.sort(key=lambda x: x.get('position_ms', 0))
+            else:
+                if evt in events_list:
+                    events_list.remove(evt)
+                    
+            self.main.loc_manager.refresh_tree_icons()
+            self.main.loc_manager._display_smart_events(path)
+
+        elif ctype == CmdType.LOC_SMART_RUN:
+            path = cmd['video_path']
+            old_events = cmd['old_events']
+            new_events = cmd['new_events']
+            
+            if is_undo:
+                self.model.temp_smart_events[path] = copy.deepcopy(old_events)
+            else:
+                self.model.temp_smart_events[path] = copy.deepcopy(new_events)
+                
+            self.main.loc_manager._display_smart_events(path)
+
         # =========================================================
         # 3. Description Specific
         # =========================================================
@@ -430,4 +492,4 @@ def _apply_state_change(self, cmd, is_undo):
                     if evt.get('head') == head and evt.get('label') == src:
                         evt['label'] = dst
 
-            self._refresh_active_view()
+            self._refresh_active_view()
@@ -167,7 +167,8 @@ def load_project(self, data, file_path):
 
             # Process events
             raw_events = item.get("events", [])
-            processed_events = []
+            processed_events = []       
+            processed_smart_events = [] 
 
             if isinstance(raw_events, list):
                 for evt in raw_events:
@@ -178,16 +179,25 @@ def load_project(self, data, file_path):
                     except ValueError:
                         pos_ms = 0
 
-                    processed_events.append(
-                        {
+                    if "confidence" in evt or "score" in evt:
+                        conf = evt.get("confidence", evt.get("score", 1.0))
+                        processed_smart_events.append({
                             "head": evt.get("head", "action"),
                             "label": evt.get("label", "?"),
                             "position_ms": pos_ms,
-                        }
-                    )
+                            "confidence": conf
+                        })
+                    else:
+                        processed_events.append({
+                            "head": evt.get("head", "action"),
+                            "label": evt.get("label", "?"),
+                            "position_ms": pos_ms,
+                        })
 
             if processed_events:
                 self.model.localization_events[final_path] = processed_events
+            if processed_smart_events:
+                self.model.smart_localization_events[final_path] = processed_smart_events
 
             loaded_count += 1
 
@@ -258,35 +268,46 @@ def _write_json(self, path):
 
         for data in sorted_items:
             abs_path = data["path"]
+            
             events = self.model.localization_events.get(abs_path, [])
+            smart_events = self.model.smart_localization_events.get(abs_path, [])
 
-            # Store path as relative if possible
             try:
                 rel_path = os.path.relpath(abs_path, base_dir).replace(os.sep, "/")
             except Exception:
                 rel_path = abs_path
 
-            # Convert events to export format
             export_events = []
+            
             for e in events:
-                export_events.append(
-                    {
-                        "head": e.get("head"),
-                        "label": e.get("label"),
-                        "position_ms": str(e.get("position_ms")),
-                    }
-                )
+                export_events.append({
+                    "head": e.get("head"),
+                    "label": e.get("label"),
+                    "position_ms": int(e.get("position_ms", 0)), 
+                })
+                
+            for e in smart_events:
+                export_events.append({
+                    "head": e.get("head"),
+                    "label": e.get("label"),
+                    "position_ms": int(e.get("position_ms", 0)),
+                    "confidence": float(e.get("confidence", 0.99)) 
+                })
+
+            export_events.sort(key=lambda x: x["position_ms"])
 
             entry = {
+                "id": data.get("name", ""),
                 "inputs": [
                     {
                         "type": "video",
                         "path": rel_path,
                         "fps": 25.0,
                     }
                 ],
-                "events": export_events,
+                "events": export_events 
             }
+
             output["data"].append(entry)
 
         try:
@@ -297,32 +318,10 @@ def _write_json(self, path):
             self.main.statusBar().showMessage(f"Saved — {os.path.basename(path)}", 1500)
             return True
         except Exception as e:
+            from PyQt6.QtWidgets import QMessageBox
             QMessageBox.critical(self.main, "Error", f"Save failed: {e}")
             return False
-        
-        for video_path in sorted(self.model.localization_events.keys()):
-                # 获取该视频所属的原始 item 定义（包含 inputs 视频源信息）
-                base_item = next((item for item in self.model.action_item_data if item["path"] == video_path), None)
-                if not base_item: continue
-                
-                # 1. 获取手工（或已确认的）标注
-                manual_events = self.model.localization_events.get(video_path, [])
-                
-                # 2. 获取未确认的智能标注
-                smart_events = self.model.smart_localization_events.get(video_path, [])
-                
-                # 构建符合 OSL 标准规范的单条数据结构
-                out_item = {
-                    "id": base_item.get("id", ""),
-                    "inputs": [{"path": f, "type": "video"} for f in base_item.get("source_files", [video_path])],
-                    "events": manual_events
-                }
-                
-                # 遵循原始结构添加 smart_events 字段（如果有的话）
-                if smart_events:
-                    out_item["smart_events"] = smart_events
-                    
-                items.append(out_item)
+            
 
     def _clear_workspace(self, full_reset=False):
         """
@@ -336,7 +335,7 @@ def _clear_workspace(self, full_reset=False):
             self.main.loc_manager.center_panel.media_preview.stop()
             self.main.loc_manager.center_panel.media_preview.player.setSource(QUrl())
 
-            # ✅ [FIX] Reset timeline UI (markers + label + slider)
+            # [FIX] Reset timeline UI (markers + label + slider)
             tl = self.main.loc_manager.center_panel.timeline
             tl.set_markers([])
             tl.set_duration(0)
@@ -345,6 +344,13 @@ def _clear_workspace(self, full_reset=False):
             # Right panel: clear table and schema
             self.main.loc_manager.right_panel.table.set_data([])
             self.main.loc_manager.right_panel.annot_mgmt.update_schema({})
+            if hasattr(self.main.loc_manager.right_panel, "smart_widget"):
+                smart_ui = self.main.loc_manager.right_panel.smart_widget
+                
+                smart_ui.reset_ui()
+                
+                smart_ui.predicted_table.set_data([])
+                smart_ui.confirmed_table.set_data([])
 
         # Reset model data
         self.model.reset(full_reset)
 
@@ -22,13 +22,38 @@ def __init__(self, video_path, start_ms, end_ms, config_path):
 
     def run(self):
         try:
+            import torch
+            if not torch.cuda.is_available():
+                torch.cuda.FloatTensor = torch.FloatTensor
+                torch.cuda.LongTensor = torch.LongTensor
+                torch.cuda.IntTensor = torch.IntTensor
+                torch.cuda.DoubleTensor = torch.DoubleTensor
+            # ==========================================
+            
             # Import library inside thread to avoid blocking main thread at startup
             from opensportslib import model
+            import subprocess
 
             with tempfile.TemporaryDirectory() as tmp_dir:
+                # Use FFmpeg to cut clips
+                clip_video_path = os.path.join(tmp_dir, "clipped_segment.mp4")
+                
+                def ms_to_ffmpeg(ms):
+                    s = ms // 1000
+                    return f"{s // 3600:02}:{(s % 3600) // 60:02}:{s % 60:02}.{ms % 1000:03}"
+
+                start_time_str = ms_to_ffmpeg(self.start_ms)
+                duration_ms = self.end_ms - self.start_ms if self.end_ms > 0 else 0
+                
+                cmd = ['ffmpeg', '-y', '-ss', start_time_str, '-i', self.video_path]
+                if duration_ms > 0:
+                    cmd += ['-t', ms_to_ffmpeg(duration_ms)]
+                cmd += ['-c', 'copy', clip_video_path]
+                
+                subprocess.run(cmd, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL, check=True)
+
                 tmp_input_json = os.path.join(tmp_dir, "temp_test.json")
                 tmp_config_yaml = os.path.join(tmp_dir, "temp_config.yaml")
-                tmp_output_json = os.path.join(tmp_dir, "predictions.json")
 
                 # --- 1. Load and dynamically patch the YAML config ---
                 with open(self.config_path, 'r', encoding='utf-8') as f:
@@ -37,34 +62,35 @@ def run(self):
                 classes = config_dict.get("DATA", {}).get("classes", [])
 
                 # 🚀 [MAC CPU ADAPTATION & PATH FIXES] 🚀
-                # Force CPU mode and disable Multi-GPU dynamically
                 if "SYSTEM" not in config_dict: config_dict["SYSTEM"] = {}
                 config_dict["SYSTEM"]["work_dir"] = tmp_dir
                 config_dict["SYSTEM"]["device"] = "cpu"
-                config_dict["SYSTEM"]["GPU"] = 0
-                config_dict["SYSTEM"]["gpu_id"] = 0
+                config_dict["SYSTEM"]["GPU"] = -1
+                config_dict["SYSTEM"]["gpu_id"] = -1
 
                 if "MODEL" not in config_dict: config_dict["MODEL"] = {}
                 config_dict["MODEL"]["multi_gpu"] = False
-                
-                # Override dataloader paths for test
+
                 if "DATA" in config_dict and "test" in config_dict["DATA"]:
-                    config_dict["DATA"]["test"]["video_path"] = os.path.dirname(self.video_path)
+                    config_dict["DATA"]["test"]["video_path"] = tmp_dir 
                     config_dict["DATA"]["test"]["path"] = tmp_input_json
                     config_dict["DATA"]["test"]["results"] = "predictions"
-                
+                    
+                if "dataloader" not in config_dict["DATA"]["test"]:
+                    config_dict["DATA"]["test"]["dataloader"] = {}
+                config_dict["DATA"]["test"]["dataloader"]["pin_memory"] = False
+
                 with open(tmp_config_yaml, 'w', encoding='utf-8') as f:
                     yaml.dump(config_dict, f)
 
-                # --- 2. Create temporary JSON for the single video ---
+                # --- 2. Create temporary JSON for the clipped video ---
                 test_data = {
                     "version": "2.0",
                     "task": "action_spotting",
                     "labels": {"ball_action": {"type": "single_label", "labels": classes}},
                     "data": [{
                         "id": "inf_vid",
-                        "inputs": [{"path": self.video_path, "type": "video", "fps": 25.0}],
-                        # 必须放一个 Dummy event 骗过 DataLoader
+                        "inputs": [{"path": clip_video_path, "type": "video", "fps": 25.0}],
                         "events": [{"head": "ball_action", "label": classes[0] if classes else "Unknown", "position_ms": 0}]
                     }]
                 }
@@ -75,34 +101,29 @@ def run(self):
                 loc_model = model.localization(config=tmp_config_yaml)
 
                 try:
-                    # 运行推理。这里一定会抛出 FileNotFoundError，因为框架底层的评估器找不到文件
                     loc_model.infer(
                         test_set=tmp_input_json, 
                         pretrained="jeetv/snpro-snbas-2024"
                     )
-                except FileNotFoundError:
-                    # [关键修复 4]：霸气忽略！
-                    # 因为报错发生在推理完成之后的“评估阶段”，所以我们直接 catch 掉这个错误，
-                    # 假装无事发生，直接进入下一步去深层文件夹里捞生成的 JSON。
+
+                except Exception as eval_err:
+                    print(f"Ignored evaluation error: {eval_err}")
                     pass
 
-                # --- 4. Parse result JSON ---
-                # 递归搜索临时文件夹下的所有 .json 文件（完美穿透 checkpoints/xxx 嵌套文件夹）
+                # --- 4. Parse result JSON and compensate timestamps ---
                 search_pattern = os.path.join(tmp_dir, "**", "*.json")
                 all_jsons = glob.glob(search_pattern, recursive=True)
 
                 valid_preds = []
                 for f in all_jsons:
                     filename = os.path.basename(f)
-                    # 排除掉我们自己生成的输入数据和配置文件
                     if "temp_test" not in filename and "temp_config" not in filename:
                         valid_preds.append(f)
 
                 if valid_preds:
-                    # 找到最新生成的那一个（防止有多个旧文件干扰）
                     actual_output_json = max(valid_preds, key=os.path.getctime)
                 else:
-                    raise FileNotFoundError(f"Could not find any generated prediction JSON in {tmp_dir}/checkpoints/")
+                    raise FileNotFoundError(f"Could not find any generated prediction JSON in {tmp_dir}")
 
                 predicted_events = []
                 if os.path.exists(actual_output_json):
@@ -111,16 +132,20 @@ def run(self):
 
                     raw_evts = output_data.get("data", [{}])[0].get("events", [])
                     for evt in raw_evts:
-                        p_ms = int(evt.get("position_ms", 0))
+                        p_ms_relative = int(evt.get("position_ms", 0))
 
-                        if p_ms == 0 and evt.get("label") == (classes[0] if classes else "Unknown"):
+                        if p_ms_relative == 0 and evt.get("label") == (classes[0] if classes else "Unknown"):
                             continue
+                        p_ms_absolute = p_ms_relative + self.start_ms
 
-                        if p_ms >= self.start_ms and (self.end_ms == 0 or p_ms <= self.end_ms):
+                        if self.end_ms == 0 or p_ms_absolute <= self.end_ms:
+                            # Get confidence 
+                            conf = evt.get("confidence", evt.get("score", 0.99))
                             predicted_events.append({
-                                "head": evt.get("head", "ball_action"),
+                                "head": "ball_action",
                                 "label": evt.get("label", "Unknown"),
-                                "position_ms": p_ms
+                                "position_ms": p_ms_absolute,
+                                "confidence": conf 
                             })
 
                 self.finished_signal.emit(predicted_events)