Clean push: Removed heavy files & added only latest snapshot

commit acf84e8767
2025-07-26 05:16:12 +05:30
250 changed files with 58564 additions and 0 deletions


@@ -0,0 +1,318 @@
"""
OpenVINO-based embedder for DeepSORT tracking.
"""
import os
import numpy as np
from pathlib import Path
import cv2
import time
from typing import List, Optional, Union
try:
    import openvino as ov
except ImportError:
    print("Installing openvino...")
    os.system('pip install --quiet "openvino>=2024.0.0"')
    import openvino as ov


class OpenVINOEmbedder:
"""
OpenVINO embedder for DeepSORT tracking.
This class provides an optimized version of the feature embedder used in DeepSORT,
using OpenVINO for inference acceleration.
"""
def __init__(
self,
model_path: Optional[str] = None,
device: str = "AUTO",
input_size: tuple = (128, 64),
batch_size: int = 16,
bgr: bool = True,
half: bool = True
):
"""
Initialize the OpenVINO embedder.
Args:
model_path: Path to the model file. If None, will use the default MobileNetV2 model.
device: Device to run inference on ('CPU', 'GPU', 'AUTO', etc.)
input_size: Input size for the model (height, width)
batch_size: Batch size for inference
bgr: Whether input images are BGR (True) or RGB (False)
half: Whether to use half precision (FP16)
"""
self.device = device
self.input_size = input_size # (h, w)
self.batch_size = batch_size
self.bgr = bgr
self.half = half
# Initialize OpenVINO Core
self.core = ov.Core()
        # Find and load model
        if model_path is None:
            # Use MobileNetV2 converted to OpenVINO
            model_path = self._find_mobilenet_model()
            # If model not found, convert it
            if model_path is None:
                print("⚠️ MobileNetV2 OpenVINO model not found. Creating it...")
                model_path = self._convert_mobilenet()
        else:
            # When model_path is explicitly provided, verify it exists
            if not os.path.exists(model_path):
                print(f"⚠️ Specified model path does not exist: {model_path}")
                print("Falling back to default model search...")
                model_path = self._find_mobilenet_model()
                if model_path is None:
                    print("⚠️ Default model search also failed. Creating new model...")
                    model_path = self._convert_mobilenet()
            else:
                print(f"✅ Using explicitly provided model: {model_path}")

        print(f"📦 Loading embedder model: {model_path} on {device}")
        # Load and compile the model
        self.model = self.core.read_model(model_path)

        # Set up configuration for device
        ov_config = {}
        if device != "CPU":
            # Keep the batch dimension dynamic (-1) so frames with fewer detections
            # than self.batch_size can still be embedded in a single call.
            self.model.reshape({0: [-1, 3, self.input_size[0], self.input_size[1]]})
            if "GPU" in device or ("AUTO" in device and "GPU" in self.core.available_devices):
                ov_config = {"GPU_DISABLE_WINOGRAD_CONVOLUTION": "YES"}

        # Compile model for the specified device
        self.compiled_model = self.core.compile_model(model=self.model, device_name=self.device, config=ov_config)

        # Get input and output tensors
        self.input_layer = self.compiled_model.inputs[0]
        self.output_layer = self.compiled_model.outputs[0]

        # Create inference requests for async inference
        self.infer_requests = [self.compiled_model.create_infer_request() for _ in range(2)]
        self.current_request_idx = 0

        # Performance stats
        self.total_inference_time = 0
        self.inference_count = 0
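
        # (Optional) When device is "AUTO", the device OpenVINO actually selected can
        # be inspected after compilation for debugging, e.g.:
        #     print(self.compiled_model.get_property("EXECUTION_DEVICES"))
        # ("EXECUTION_DEVICES" is available in recent OpenVINO releases; this is an
        # illustrative debugging aid, not something the rest of this code relies on.)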
    def _find_mobilenet_model(self) -> Optional[str]:
        """
        Find MobileNetV2 model converted to OpenVINO format.

        Returns:
            Path to the model file or None if not found
        """
        search_paths = [
            # Standard locations
            "mobilenetv2_embedder/mobilenetv2.xml",
            "../mobilenetv2_embedder/mobilenetv2.xml",
            "../../mobilenetv2_embedder/mobilenetv2.xml",
            # Look in models directory
            "../models/mobilenetv2.xml",
            "../../models/mobilenetv2.xml",
            # Look relative to DeepSORT location
            os.path.join(os.path.dirname(__file__), "models/mobilenetv2.xml"),
            # Look in openvino_models
            "../openvino_models/mobilenetv2.xml",
            "../../openvino_models/mobilenetv2.xml"
        ]
        for path in search_paths:
            if os.path.exists(path):
                return path
        return None
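
    # Note: the relative entries in search_paths above resolve against the process's
    # current working directory, so whether a model is found depends on where the
    # script is launched from; only the __file__-based entry is location-independent.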
    def _convert_mobilenet(self) -> Optional[str]:
        """
        Convert MobileNetV2 model to OpenVINO IR format.

        Returns:
            Path to the converted model, or None if conversion failed
        """
        try:
            # Create directory for the model
            output_dir = Path("mobilenetv2_embedder")
            output_dir.mkdir(exist_ok=True)

            # First, we need to download the PyTorch model
            import torch
            import torch.nn as nn
            from torchvision.models import mobilenet_v2, MobileNet_V2_Weights

            print("⬇️ Downloading MobileNetV2 model...")
            model = mobilenet_v2(weights=MobileNet_V2_Weights.IMAGENET1K_V1)

            # Modify for feature extraction: drop the classifier, pool the feature
            # map globally, and flatten to one embedding vector per image.
            class FeatureExtractor(nn.Module):
                def __init__(self, model):
                    super().__init__()
                    self.features = model.features
                    self.pool = nn.AdaptiveAvgPool2d(1)

                def forward(self, x):
                    x = self.pool(self.features(x))
                    return torch.flatten(x, 1)

            feature_model = FeatureExtractor(model)
            feature_model.eval()
            # Save to ONNX
            onnx_path = output_dir / "mobilenetv2.onnx"
            print(f"💾 Converting to ONNX: {onnx_path}")
            dummy_input = torch.randn(1, 3, self.input_size[0], self.input_size[1])
            torch.onnx.export(
                feature_model,
                dummy_input,
                str(onnx_path),
                input_names=["input"],
                output_names=["output"],
                dynamic_axes={"input": {0: "batch_size"}, "output": {0: "batch_size"}},
                opset_version=11
            )

            # Convert ONNX to OpenVINO IR
            ir_path = output_dir / "mobilenetv2.xml"
            print(f"💾 Converting to OpenVINO IR: {ir_path}")

            # Use the current OpenVINO model-conversion API
            try:
                print("Converting ONNX model using ov.convert_model...")
                print(f"Input model: {onnx_path}")
                print(f"Output IR: {ir_path}")
                print(f"Data type: {'FP16' if self.half else 'FP32'}")

                # convert_model returns an ov.Model; save_model writes the IR files
                # (compress_to_fp16 controls FP16 weight compression).
                ov_model = ov.convert_model(str(onnx_path))
                ov.save_model(ov_model, str(ir_path), compress_to_fp16=self.half)
                print("✅ Model successfully converted using ov.convert_model")
            except Exception as e:
                print(f"Error with ov.convert_model: {e}, trying legacy Model Optimizer...")

                # Fallback to the legacy mo.py script via subprocess if needed
                import subprocess
                import sys

                # Try to find mo.py in the OpenVINO installation
                mo_paths = [
                    os.path.join(os.environ.get("INTEL_OPENVINO_DIR", ""), "tools", "mo", "mo.py"),
                    os.path.join(os.path.dirname(os.path.dirname(os.__file__)), "openvino", "tools", "mo", "mo.py"),
                    "C:/Program Files (x86)/Intel/openvino_2021/tools/mo/mo.py",
                    "C:/Program Files (x86)/Intel/openvino/tools/mo/mo.py"
                ]
                mo_script = None
                for path in mo_paths:
                    if os.path.exists(path):
                        mo_script = path
                        break
                if not mo_script:
                    raise FileNotFoundError("Cannot find OpenVINO Model Optimizer (mo.py)")

                cmd = [
                    sys.executable,
                    mo_script,
                    "--input_model", str(onnx_path),
                    "--output_dir", str(output_dir),
                    "--input_shape", f"[{self.batch_size},3,{self.input_size[0]},{self.input_size[1]}]",
                    "--data_type", "FP16" if self.half else "FP32"
                ]
                print(f"Running Model Optimizer: {' '.join(cmd)}")
                result = subprocess.run(cmd, capture_output=True, text=True)
                if result.returncode != 0:
                    print(f"Error running Model Optimizer: {result.stderr}")
                    raise RuntimeError(f"Model Optimizer failed: {result.stderr}")

            print(f"✅ Model converted: {ir_path}")
            return str(ir_path)
        except Exception as e:
            print(f"❌ Error converting model: {e}")
            import traceback
            traceback.print_exc()
            return None
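
    # A converted IR can be sanity-checked before use without compiling it for a
    # device, e.g. (illustrative; the path and shape depend on constructor args):
    #     m = ov.Core().read_model("mobilenetv2_embedder/mobilenetv2.xml")
    #     print(m.inputs[0].partial_shape)  # expected [?,3,128,64] with dynamic batch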
    def preprocess(self, crops: List[np.ndarray]) -> np.ndarray:
        """
        Preprocess image crops for model input.

        Args:
            crops: List of image crops

        Returns:
            Preprocessed batch tensor
        """
        processed = []
        for crop in crops:
            # Resize to expected input size (cv2.resize takes (width, height))
            crop = cv2.resize(crop, (self.input_size[1], self.input_size[0]))
            # Convert BGR to RGB if needed (the ImageNet-pretrained backbone expects RGB)
            if self.bgr and crop.shape[2] == 3:
                crop = cv2.cvtColor(crop, cv2.COLOR_BGR2RGB)
            # Normalize (0-255 to 0-1)
            crop = crop.astype(np.float32) / 255.0
            # Change to NCHW format
            crop = crop.transpose(2, 0, 1)
            processed.append(crop)
        # Stack into batch
        batch = np.stack(processed)
        return batch
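
    # Note: the torchvision MobileNetV2 weights exported in _convert_mobilenet were
    # trained with ImageNet normalization (mean [0.485, 0.456, 0.406], std
    # [0.229, 0.224, 0.225]) applied after scaling to 0-1. preprocess() only rescales
    # to 0-1; if embedding quality matters more than raw speed, an optional extra step
    # (applied while the crop is still HWC, before the transpose) could be:
    #     crop = (crop - np.array([0.485, 0.456, 0.406], np.float32)) / \
    #            np.array([0.229, 0.224, 0.225], np.float32)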
    def __call__(self, crops: List[np.ndarray]) -> np.ndarray:
        """
        Get embeddings for the image crops.

        Args:
            crops: List of image crops

        Returns:
            Embeddings for each crop
        """
        if not crops:
            return np.array([])

        # Preprocess crops
        batch = self.preprocess(crops)

        # Run inference
        start_time = time.time()

        # Use async inference to improve performance
        request = self.infer_requests[self.current_request_idx]
        self.current_request_idx = (self.current_request_idx + 1) % len(self.infer_requests)
        request.start_async({self.input_layer.any_name: batch})
        request.wait()

        # Get output
        embeddings = request.get_output_tensor().data

        # Track inference time
        inference_time = time.time() - start_time
        self.total_inference_time += inference_time
        self.inference_count += 1

        # Normalize embeddings
        embeddings = embeddings / np.linalg.norm(embeddings, axis=1, keepdims=True)
        return embeddings
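

# ---------------------------------------------------------------------------
# Usage sketch (illustrative only, not part of the tracking pipeline itself).
# It builds the embedder, embeds a few dummy BGR crops, and shows, in comments,
# how the result could be handed to deep_sort_realtime, assuming a version of
# that package which accepts `embedder=None` together with an `embeds` argument.
# Detection tuples and tracker arguments below are placeholders.
# ---------------------------------------------------------------------------
if __name__ == "__main__":
    embedder = OpenVINOEmbedder(device="AUTO", half=True)

    # Dummy person crops (H x W x 3, BGR, uint8) standing in for real detections
    crops = [np.random.randint(0, 255, (256, 128, 3), dtype=np.uint8) for _ in range(4)]
    embeds = embedder(crops)
    print("Embedding batch shape:", embeds.shape)  # e.g. (4, 1280) for MobileNetV2
    print("Avg inference time:", embedder.total_inference_time / embedder.inference_count)

    # Hypothetical integration with deep_sort_realtime:
    #     from deep_sort_realtime.deepsort_tracker import DeepSort
    #     tracker = DeepSort(max_age=30, embedder=None)
    #     detections = [([left, top, w, h], confidence, "person"), ...]
    #     tracks = tracker.update_tracks(detections, embeds=embeds, frame=frame)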