Просмотр исходного кода

feat: Add a new FastAPI service for palm oil ripeness analysis, integrating ONNX/YOLO models, local history archiving, and cloud-based vectorization and storage.

Dr-Swopt 3 дня назад
Родитель
Commit
26730944ea
2 изменённых файла: 93 добавления и 68 удалений
  1. 20 4
      demo_app.py
  2. 73 64
      src/api/main.py

+ 20 - 4
demo_app.py

@@ -67,6 +67,20 @@ st.sidebar.slider(
     on_change=update_confidence
     on_change=update_confidence
 )
 )
 
 
+st.sidebar.markdown("---")
+st.sidebar.subheader("Inference Engine")
+engine_choice = st.sidebar.selectbox(
+    "Select Model Engine",
+    ["YOLO26 (ONNX - High Speed)", "YOLO26 (PyTorch - Native)"],
+    index=0,
+    help="ONNX is optimized for latency. PyTorch provides native object handling."
+)
+model_type = "onnx" if "ONNX" in engine_choice else "pytorch"
+if model_type == "pytorch":
+    st.sidebar.warning("PyTorch Engine: Higher Memory Usage")
+else:
+    st.sidebar.info("ONNX Engine: ~39ms Latency")
+
 # Helper to reset results when files change
 # Helper to reset results when files change
 def reset_single_results():
 def reset_single_results():
     st.session_state.last_detection = None
     st.session_state.last_detection = None
@@ -291,9 +305,10 @@ with tab1:
 
 
         # 1. Auto-Detection Trigger
         # 1. Auto-Detection Trigger
         if uploaded_file and st.session_state.last_detection is None:
         if uploaded_file and st.session_state.last_detection is None:
-            with st.spinner("Processing Detections Locally..."):
+            with st.spinner(f"Processing with {model_type.upper()} Engine..."):
                 files = {"file": (uploaded_file.name, uploaded_file.getvalue(), uploaded_file.type)}
                 files = {"file": (uploaded_file.name, uploaded_file.getvalue(), uploaded_file.type)}
-                res = requests.post(f"{API_BASE_URL}/analyze", files=files)
+                payload = {"model_type": model_type}
+                res = requests.post(f"{API_BASE_URL}/analyze", files=files, data=payload)
                 if res.status_code == 200:
                 if res.status_code == 200:
                     st.session_state.last_detection = res.json()
                     st.session_state.last_detection = res.json()
                     st.rerun() # Refresh to show results immediately
                     st.rerun() # Refresh to show results immediately
@@ -530,9 +545,10 @@ with tab2:
         st.write("##") # Alignment
         st.write("##") # Alignment
         if st.session_state.last_batch_results is None and uploaded_files:
         if st.session_state.last_batch_results is None and uploaded_files:
             if st.button("🔍 Process Batch", type="primary", width='stretch'):
             if st.button("🔍 Process Batch", type="primary", width='stretch'):
-                with st.spinner(f"Analyzing {len(uploaded_files)} images..."):
+                with st.spinner(f"Analyzing {len(uploaded_files)} images with {model_type.upper()}..."):
                     files = [("files", (f.name, f.getvalue(), f.type)) for f in uploaded_files]
                     files = [("files", (f.name, f.getvalue(), f.type)) for f in uploaded_files]
-                    res = requests.post(f"{API_BASE_URL}/process_batch", files=files)
+                    payload = {"model_type": model_type}
+                    res = requests.post(f"{API_BASE_URL}/process_batch", files=files, data=payload)
                     
                     
                     if res.status_code == 200:
                     if res.status_code == 200:
                         data = res.json()
                         data = res.json()

+ 73 - 64
src/api/main.py

@@ -4,6 +4,7 @@ import os
 import shutil
 import shutil
 from fastapi import FastAPI, File, UploadFile, Body, Form, BackgroundTasks
 from fastapi import FastAPI, File, UploadFile, Body, Form, BackgroundTasks
 import onnxruntime as ort
 import onnxruntime as ort
+from ultralytics import YOLO
 import numpy as np
 import numpy as np
 
 
 from dotenv import load_dotenv
 from dotenv import load_dotenv
@@ -46,64 +47,67 @@ os.environ["GOOGLE_APPLICATION_CREDENTIALS"] = "gemini-embedding-service-key.jso
 
 
 app = FastAPI(title="Palm Oil Ripeness Service (DDD)")
 app = FastAPI(title="Palm Oil Ripeness Service (DDD)")
 
 
-# Initialize ONNX model
-onnx_path = 'best.onnx'
-ort_session = ort.InferenceSession(onnx_path)
-input_name = ort_session.get_inputs()[0].name
-class_names = {
-    0: 'Empty_Bunch',
-    1: 'Underripe',
-    2: 'Abnormal',
-    3: 'Ripe',
-    4: 'Unripe',
-    5: 'Overripe'
-}
-
-def preprocess(img: Image.Image):
-    """Preprocess image for YOLO ONNX input [1, 3, 640, 640]."""
-    img = img.convert("RGB")
-    # Store original size for scaling
-    orig_w, orig_h = img.size
-    img_resized = img.resize((640, 640))
-    img_array = np.array(img_resized) / 255.0
-    img_array = img_array.transpose(2, 0, 1) # HWC to CHW
-    img_array = img_array.reshape(1, 3, 640, 640).astype(np.float32)
-    return img_array, orig_w, orig_h
-
-def run_inference(img: Image.Image, conf_threshold: float):
-    """Run ONNX inference and return list of detections."""
-    img_array, orig_w, orig_h = preprocess(img)
-    outputs = ort_session.run(None, {input_name: img_array})
-    # Output shape: [1, 300, 6] -> [x1, y1, x2, y2, conf, class_id]
-    detections_batch = outputs[0]
-    
-    scale_w = orig_w / 640.0
-    scale_h = orig_h / 640.0
-    
-    detections = []
-    valid_count = 0
-    for i in range(detections_batch.shape[1]):
-        det = detections_batch[0, i]
-        conf = float(det[4])
-        if conf >= conf_threshold:
-            valid_count += 1
-            x1, y1, x2, y2 = det[:4]
-            # Rescale
-            x1 *= scale_w
-            y1 *= scale_h
-            x2 *= scale_w
-            y2 *= scale_h
-            class_id = int(det[5])
-            class_name = class_names.get(class_id, "Unknown")
-            
+class ModelManager:
+    def __init__(self, onnx_path: str, pt_path: str):
+        self.onnx_session = ort.InferenceSession(onnx_path)
+        self.onnx_input_name = self.onnx_session.get_inputs()[0].name
+        self.pt_model = YOLO(pt_path)
+        self.class_names = self.pt_model.names
+
+    def preprocess_onnx(self, img: Image.Image):
+        img = img.convert("RGB")
+        orig_w, orig_h = img.size
+        img_resized = img.resize((640, 640))
+        img_array = np.array(img_resized) / 255.0
+        img_array = img_array.transpose(2, 0, 1)
+        img_array = img_array.reshape(1, 3, 640, 640).astype(np.float32)
+        return img_array, orig_w, orig_h
+
+    def run_onnx_inference(self, img: Image.Image, conf_threshold: float):
+        img_array, orig_w, orig_h = self.preprocess_onnx(img)
+        outputs = self.onnx_session.run(None, {self.onnx_input_name: img_array})
+        detections_batch = outputs[0]
+        
+        scale_w = orig_w / 640.0
+        scale_h = orig_h / 640.0
+        
+        detections = []
+        valid_count = 0
+        for i in range(detections_batch.shape[1]):
+            det = detections_batch[0, i]
+            conf = float(det[4])
+            if conf >= conf_threshold:
+                valid_count += 1
+                x1, y1, x2, y2 = det[:4]
+                x1 *= scale_w; y1 *= scale_h; x2 *= scale_w; y2 *= scale_h
+                class_id = int(det[5])
+                class_name = self.class_names.get(class_id, "Unknown")
+                
+                detections.append({
+                    "bunch_id": valid_count,
+                    "class": class_name,
+                    "confidence": round(conf, 2),
+                    "is_health_alert": class_name in ["Abnormal", "Empty_Bunch"],
+                    "box": [float(x1), float(y1), float(x2), float(y2)]
+                })
+        return detections
+
+    def run_pytorch_inference(self, img: Image.Image, conf_threshold: float):
+        results = self.pt_model(img, conf=conf_threshold, verbose=False)
+        detections = []
+        for i, box in enumerate(results[0].boxes):
+            class_id = int(box.cls)
+            class_name = self.class_names.get(class_id, "Unknown")
             detections.append({
             detections.append({
-                "bunch_id": valid_count,
+                "bunch_id": i + 1,
                 "class": class_name,
                 "class": class_name,
-                "confidence": round(conf, 2),
+                "confidence": round(float(box.conf), 2),
                 "is_health_alert": class_name in ["Abnormal", "Empty_Bunch"],
                 "is_health_alert": class_name in ["Abnormal", "Empty_Bunch"],
-                "box": [float(x1), float(y1), float(x2), float(y2)]
+                "box": box.xyxy.tolist()[0]
             })
             })
-    return detections
+        return detections
+
+model_manager = ModelManager(onnx_path='best.onnx', pt_path='best.pt')
 
 
 
 
 # Global state for the confidence threshold
 # Global state for the confidence threshold
@@ -146,17 +150,19 @@ async def set_confidence(threshold: float = Body(..., embed=True)):
 
 
 
 
 @app.post("/analyze")
 @app.post("/analyze")
-async def analyze_with_health_metrics(file: UploadFile = File(...)):
+async def analyze_with_health_metrics(file: UploadFile = File(...), model_type: str = Form("onnx")):
     """Industry-grade analysis with health metrics and summary."""
     """Industry-grade analysis with health metrics and summary."""
     image_bytes = await file.read()
     image_bytes = await file.read()
     img = Image.open(io.BytesIO(image_bytes))
     img = Image.open(io.BytesIO(image_bytes))
     
     
-    # Run ONNX inference (natively NMS-free)
-    detections = run_inference(img, current_conf)
-    
-    # Initialize summary for all known classes
-    summary = {name: 0 for name in class_names.values()}
+    # Select Inference Engine
+    if model_type == "pytorch":
+        detections = model_manager.run_pytorch_inference(img, current_conf)
+    else:
+        detections = model_manager.run_onnx_inference(img, current_conf)
     
     
+    # Initialize summary
+    summary = {name: 0 for name in model_manager.class_names.values()}
     for det in detections:
     for det in detections:
         summary[det['class']] += 1
         summary[det['class']] += 1
     
     
@@ -220,8 +226,8 @@ async def vectorize_and_store(file: UploadFile = File(...), detection_data: str
             os.remove(temp_path)
             os.remove(temp_path)
 
 
 @app.post("/process_batch")
 @app.post("/process_batch")
-async def process_batch(files: List[UploadFile] = File(...)):
-    """Handles multiple images: Detect -> Vectorize -> Store. Graceful handling of cloud errors."""
+async def process_batch(files: List[UploadFile] = File(...), model_type: str = Form("onnx")):
+    """Handles multiple images: Detect -> Vectorize -> Store."""
     batch_results = []
     batch_results = []
     temp_files = []
     temp_files = []
 
 
@@ -234,9 +240,12 @@ async def process_batch(files: List[UploadFile] = File(...)):
                 shutil.copyfileobj(file.file, f_out)
                 shutil.copyfileobj(file.file, f_out)
             temp_files.append(path)
             temp_files.append(path)
 
 
-            # 2. ONNX Detect (natively NMS-free)
+            # 2. Detect
             img = Image.open(path)
             img = Image.open(path)
-            detections = run_inference(img, current_conf)
+            if model_type == "pytorch":
+                detections = model_manager.run_pytorch_inference(img, current_conf)
+            else:
+                detections = model_manager.run_onnx_inference(img, current_conf)
             
             
             # 3. Process all detections in the image
             # 3. Process all detections in the image
             for det in detections:
             for det in detections: