5: readme

4: debugging flag
3
2026-01-01 11:39:26 +01:00 · 2026-01-01 11:28:57 +01:00 · 2026-01-01 11:20:05 +01:00 · 2026-01-01 10:07:37 +01:00 · 2026-01-01 09:53:11 +01:00
4 changed files with 583 additions and 203 deletions
--- a/pycache/inference.cpython-311.pyc
+++ b/pycache/inference.cpython-311.pyc
--- a/app.py
+++ b/app.py
@ -1,51 +1,122 @@
+import base64
+import json
 import logging
 import sys
-import os
 import threading
-import json
 import time
 import traceback
-import base64

 import cv2
 import numpy as np
 import paho.mqtt.client as mqtt
-from flask import Flask, render_template, jsonify, request, Response
+from flask import Flask, Response, jsonify, render_template, request

-# test
-# Import Config, Manager, and NEW Inference Worker
 from config import Config
-from manager import CameraManager
 from inference import InferenceWorker
+from manager import CameraManager

-# --- Logging Setup ---
+# ------------------------------------------------------------------------------
+# 1. USER CONFIGURATION (Edit these values here)
+# ------------------------------------------------------------------------------
+
+# Enable verbose debug logs (True = verbose, False = quiet/crucial only)
+DEBUG_LOG = False
+
+# Rate Limiting: How many seconds to wait between detections per camera
+DETECTION_INTERVAL = 10
+
+# Frame Quality Threshold: Skip images with standard deviation lower than this.
+# - Low values (1-5) allow darker/low-contrast images (good for night).
+# - High values (20-40) filter out gray/blank screens but might skip valid dark images.
+# - Set to 0 to disable this check entirely.
+FRAME_STD_THRESHOLD = 1.0
+
+# ------------------------------------------------------------------------------
+
+
+def _cfg(*names, default=None):
+    """Return first matching attribute from Config, else default."""
+    for n in names:
+        if hasattr(Config, n):
+            return getattr(Config, n)
+    return default
+
+
+# --- Logging setup ---
+LOG_LEVEL = logging.DEBUG if DEBUG_LOG else _cfg("LOG_LEVEL", "LOGLEVEL", default=logging.INFO)
 logging.basicConfig(
-    level=Config.LOG_LEVEL,
+    level=LOG_LEVEL,
    format='%(asctime)s [%(levelname)s] %(message)s',
-    handlers=[logging.StreamHandler(sys.stdout)]
+    handlers=[logging.StreamHandler(sys.stdout)],
 )
 logger = logging.getLogger(__name__)

 app = Flask(__name__)

-# --- Initialize Components ---
+# --- Initialize components ---
 camera_manager = CameraManager()
-inference_worker = InferenceWorker() # <--- NEW
-inference_worker.start()             # <--- Start the background thread
+inference_worker = InferenceWorker(debug_log=DEBUG_LOG)
+inference_worker.start()

-# --- MQTT Setup ---
+# --- MQTT setup ---
 mqtt_client = mqtt.Client()
-if Config.MQTT_USERNAME and Config.MQTT_PASSWORD:
-    mqtt_client.username_pw_set(Config.MQTT_USERNAME, Config.MQTT_PASSWORD)
+
+MQTT_USERNAME = _cfg("MQTT_USERNAME", "MQTTUSERNAME", default=None)
+MQTT_PASSWORD = _cfg("MQTT_PASSWORD", "MQTTPASSWORD", default=None)
+MQTT_BROKER = _cfg("MQTT_BROKER", "MQTTBROKER", default="127.0.0.1")
+MQTT_PORT = int(_cfg("MQTT_PORT", "MQTTPORT", default=1883))
+MQTT_TOPIC = _cfg("MQTT_TOPIC", "MQTTTOPIC", default="homeassistant/sensor/RTSPCamDigitDetection/state")
+
+if MQTT_USERNAME and MQTT_PASSWORD:
+    mqtt_client.username_pw_set(MQTT_USERNAME, MQTT_PASSWORD)

 try:
-    mqtt_client.connect(Config.MQTT_BROKER, Config.MQTT_PORT, 60)
-    mqtt_client.loop_start() # START THE LOOP HERE
-    logger.info(f"Connected to MQTT Broker at {Config.MQTT_BROKER}:{Config.MQTT_PORT}")
+    mqtt_client.connect(MQTT_BROKER, MQTT_PORT, 60)
+    mqtt_client.loop_start()
+    logger.info("Connected to MQTT Broker at %s:%s", MQTT_BROKER, MQTT_PORT)
 except Exception as e:
-    logger.error(f"Failed to connect to MQTT Broker: {e}")
+    logger.error("Failed to connect to MQTT Broker: %s", e)
+
+
+# --- Helpers ---
+_last_log = {}
+
+def log_rl(level, key, msg, every_s=10):
+    """Rate-limited log. Use for noisy conditions."""
+    now = time.time()
+    last = _last_log.get(key, 0.0)
+    if now - last >= every_s:
+        _last_log[key] = now
+        logger.log(level, msg)
+
+
+def log_debug(key, msg, every_s=0):
+    """Debug-only logging with optional rate limiting."""
+    if not DEBUG_LOG:
+        return
+    if every_s and every_s > 0:
+        log_rl(logging.DEBUG, key, msg, every_s=every_s)
+    else:
+        logger.debug(msg)
+
+
+def log_condition(camera_id: str, cond_key: str, msg: str, *, crucial=False,
+                  debug_level=logging.DEBUG, debug_every=5,
+                  nodebug_level=logging.WARNING, nodebug_every=60):
+    """Log conditions (skip reasons, degraded state) without spamming.
+
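+    - If DEBUG_LOG=True -> every condition is logged at debug_level, at most once per debug_every seconds per camera/condition key.
+    - If DEBUG_LOG=False -> only crucial conditions are logged, at nodebug_level, at most once per nodebug_every seconds; non-crucial ones are dropped.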
+    """
+    key = f"{camera_id}:{cond_key}"
+    if DEBUG_LOG:
+        log_rl(debug_level, key, msg, every_s=debug_every)
+        return
+
+    if crucial:
+        log_rl(nodebug_level, key, msg, every_s=nodebug_every)
+

-# --- Helper Functions (UI Only) ---
 def crop_image_for_ui(image, roi_list, scaleX, scaleY):
    """Helper for the /crop endpoint (UI preview only)."""
    cropped_images = []
@ -62,100 +133,162 @@ def crop_image_for_ui(image, roi_list, scaleX, scaleY):
            pass
    return cropped_images

-def publish_detected_number(camera_id, detected_number):
-    """Publish result to MQTT."""
-    topic = f"{Config.MQTT_TOPIC}/{camera_id}"
-    payload = json.dumps({"value": detected_number})
+
+def publish_detected_number(camera_id, detected_number, confidence=None):
+    """Publish result to MQTT with optional confidence score."""
+    topic = f"{MQTT_TOPIC}/{camera_id}"
+
+    payload_dict = {"value": detected_number}
+    if confidence is not None:
+        payload_dict["confidence"] = round(float(confidence), 2)
+
+    payload = json.dumps(payload_dict)
+
    try:
        mqtt_client.publish(topic, payload)
-        logger.info(f"Published to {topic}: {detected_number}")
+        # Keep this INFO even when debug is off: it's the primary business output.
+        log_msg = f"Published to {topic}: {detected_number}"
+        if confidence is not None:
+            log_msg += f" (Conf: {confidence:.2f})"
+        logger.info(log_msg)
    except Exception as e:
-        logger.error(f"MQTT Publish failed: {e}")
+        logger.error("MQTT Publish failed: %s", e)

-# --- Main Processing Loop (Refactored) ---
-# Add this global dictionary at the top of app.py (near other globals)
+
+# --- Main processing loop ---
 last_processed_time = {}

-# Update process_all_cameras function
 def process_all_cameras():
-    """
-    Revised Loop with Rate Limiting
-    """
-    # Configurable interval (seconds)
-    DETECTION_INTERVAL = 10
+    hb_last = 0.0

    while True:
        try:
-            # --- Part 1: Process Results ---
+            # Heartbeat only in debug mode
+            if DEBUG_LOG:
+                now = time.time()
+                if now - hb_last >= 5.0:
+                    hb_last = now
+                    in_q = getattr(inference_worker, "input_queue", None)
+                    out_q = getattr(inference_worker, "result_queue", None)
+                    logger.info(
+                        "HB mainloop alive; in_q=%s out_q=%s dropped=%s processed=%s last_invoke_s=%s",
+                        (in_q.qsize() if in_q else "n/a"),
+                        (out_q.qsize() if out_q else "n/a"),
+                        getattr(inference_worker, "dropped_tasks", "n/a"),
+                        getattr(inference_worker, "processed_tasks", "n/a"),
+                        getattr(inference_worker, "last_invoke_secs", "n/a"),
+                    )
+
+            # --- Part 1: process results ---
            while True:
                result = inference_worker.get_result()
                if not result:
                    break

-                cam_id = result['camera_id']
-                val = result['value']
+                cam_id = result.get('camera_id')

-                camera_manager.results[cam_id] = val
-                publish_detected_number(cam_id, val)
+                # Debug-only latency trace
+                if DEBUG_LOG and result.get("task_ts") is not None:
+                    try:
+                        age = time.time() - float(result["task_ts"])
+                        logger.info(
+                            "Result cam=%s type=%s task_id=%s age_s=%.3f timing=%s",
+                            cam_id,
+                            result.get("type"),
+                            result.get("task_id"),
+                            age,
+                            result.get("timing_s"),
+                        )
+                    except Exception:
+                        pass

-            # --- Part 2: Feed Frames ---
+                if result.get('type') == 'success':
+                    val = result['value']
+                    conf = result.get('confidence')
+                    camera_manager.results[cam_id] = val
+                    publish_detected_number(cam_id, val, conf)
+
+                elif result.get('type') == 'error':
+                    msg = result.get('message', 'Unknown error')
+
+                    # When debug is off, avoid spamming "Low confidence" messages.
+                    if DEBUG_LOG:
+                        logger.warning("[%s] Detection skipped: %s", cam_id, msg)
+                    else:
+                        # Crucial errors: rate-limited warnings.
+                        # Filter out "Low confidence" unless it's crucial for you.
+                        if not str(msg).lower().startswith("low confidence"):
+                            log_condition(cam_id, "detect_error", f"[{cam_id}] Detection skipped: {msg}", crucial=True)
+
+            # --- Part 2: feed frames ---
            camera_manager.load_roi_config()

            for camera_id, camera_data in camera_manager.cameras.items():
                if not camera_data.get("active", True):
                    continue

-                # RATE LIMIT CHECK
                current_time = time.time()
-                last_time = last_processed_time.get(camera_id, 0)
+                last_time = last_processed_time.get(camera_id, 0.0)

                if current_time - last_time < DETECTION_INTERVAL:
-                    continue # Skip this camera, it's too soon
+                    log_debug(f"{camera_id}:rate", f"[{camera_id}] skip: rate limit", every_s=30)
+                    continue

                stream = camera_data.get("stream")
-                if not stream: continue
+                if not stream:
+                    log_condition(camera_id, "nostream", f"[{camera_id}] skip: no stream", crucial=True)
+                    continue

-                # Warmup Check
-                if (current_time - stream.start_time) < 5:
+                start_time = getattr(stream, "start_time", getattr(stream, "starttime", None))
+                if start_time is not None and (current_time - start_time) < 5:
+                    log_debug(f"{camera_id}:warmup", f"[{camera_id}] skip: warmup", every_s=10)
                    continue

                frame = stream.read()
-                
                if frame is None:
+                    log_condition(camera_id, "noframe", f"[{camera_id}] skip: frame is None", crucial=True)
                    continue

-                if np.std(frame) < 10:
+                # STD Check
+                frame_std = float(np.std(frame))
+                if frame_std < FRAME_STD_THRESHOLD:
+                    log_condition(
+                        camera_id,
+                        "lowstd",
+                        f"[{camera_id}] skip: low frame std={frame_std:.2f} (<{FRAME_STD_THRESHOLD})",
+                        crucial=True,
+                        debug_every=5,
+                        nodebug_every=60,
+                    )
                    continue

                roi_list = camera_manager.rois.get(camera_id, [])
                if not roi_list:
+                    log_condition(camera_id, "norois", f"[{camera_id}] skip: no ROIs configured", crucial=True)
                    continue

-                # SEND TO WORKER
-                inference_worker.add_task(camera_id, roi_list, frame)
-                
-                # Update last processed time
+                inference_worker.add_task(camera_id, roi_list, frame, frame_std=frame_std)
                last_processed_time[camera_id] = current_time

-            # Sleep briefly to prevent CPU spinning, but keep it responsive for results
            time.sleep(0.1)

        except Exception as e:
-            logger.error(f"Global process loop error: {e}")
+            logger.error("Global process loop error: %s", e)
            traceback.print_exc()
            time.sleep(5)


-# --- Flask Routes (Unchanged logic, just imports) ---
-
+# --- Flask routes ---
@app.route('/')
 def index():
    return render_template('index.html')

+
@app.route('/cameras', methods=['GET'])
 def get_cameras():
    return jsonify(camera_manager.get_camera_list())

+
@app.route('/video/<camera_id>')
 def video_feed(camera_id):
    def generate():
@ -164,11 +297,16 @@ def video_feed(camera_id):
            if frame is not None:
                ret, jpeg = cv2.imencode('.jpg', frame)
                if ret:
-                    yield (b'--frame\r\n' b'Content-Type: image/jpeg\r\n\r\n' + jpeg.tobytes() + b'\r\n\r\n')
+                    yield (
+                        b'--frame\r\n'
+                        b'Content-Type: image/jpeg\r\n\r\n' + jpeg.tobytes() + b'\r\n\r\n'
+                    )
            else:
                time.sleep(0.1)
+
    return Response(generate(), mimetype='multipart/x-mixed-replace; boundary=frame')

+
@app.route('/snapshot/<camera_id>')
 def snapshot(camera_id):
    frame = camera_manager.get_frame(camera_id)
@ -178,27 +316,29 @@ def snapshot(camera_id):
            return Response(jpeg.tobytes(), mimetype='image/jpeg')
    return 'No frame available', 404

+
@app.route('/rois/<camera_id>', methods=['GET'])
 def get_rois(camera_id):
-    # ... (Same logic as Step 3, just ensure it uses camera_manager) ...
    try:
        camera_manager.load_roi_config()
        all_rois = camera_manager.rois
+
        img_width = request.args.get("img_width", type=float)
        img_height = request.args.get("img_height", type=float)

        if not img_width or not img_height:
-             return jsonify(all_rois.get(camera_id, []))
+            return jsonify(all_rois.get(camera_id, []))

        cam = camera_manager.cameras.get(camera_id)
        if cam and cam.get("stream"):
            real_w = cam["stream"].width or cam["width"]
            real_h = cam["stream"].height or cam["height"]
        else:
-             return jsonify({"error": "Camera not ready"}), 500
+            return jsonify({"error": "Camera not ready"}), 500

        scaleX = img_width / real_w
        scaleY = img_height / real_h
+
        scaled_rois = []
        for roi in all_rois.get(camera_id, []):
            scaled_rois.append({
@ -207,29 +347,34 @@ def get_rois(camera_id):
                "y": int(round(roi["y"] * scaleY)),
                "width": int(round(roi["width"] * scaleX)),
                "height": int(round(roi["height"] * scaleY)),
-                "angle": roi["angle"]
+                "angle": roi.get("angle", 0),
            })
+
        return jsonify(scaled_rois)
+
    except Exception as e:
        return jsonify({"error": str(e)}), 500

+
@app.route("/save_rois", methods=["POST"])
 def save_rois_api():
-    # ... (Same logic as Step 3) ...
    data = request.json
+
    camera_id = data.get("camera_id")
    new_rois = data.get("rois")
    img_width = data.get("img_width")
    img_height = data.get("img_height")

-    if not camera_id or new_rois is None: return jsonify({"success": False})
+    if not camera_id or new_rois is None:
+        return jsonify({"success": False})

    cam = camera_manager.cameras.get(camera_id)
-    if not cam: return jsonify({"success": False})
+    if not cam:
+        return jsonify({"success": False})

    stream = cam.get("stream")
-    real_w = stream.width if stream and stream.width else cam["width"]
-    real_h = stream.height if stream and stream.height else cam["height"]
+    real_w = stream.width if stream and getattr(stream, "width", None) else cam["width"]
+    real_h = stream.height if stream and getattr(stream, "height", None) else cam["height"]

    scaleX = real_w / img_width if img_width else 1
    scaleY = real_h / img_height if img_height else 1
@ -242,24 +387,26 @@ def save_rois_api():
            "y": int(round(roi["y"] * scaleY)),
            "width": int(round(roi["width"] * scaleX)),
            "height": int(round(roi["height"] * scaleY)),
-            "angle": roi["angle"]
+            "angle": roi.get("angle", 0),
        })
+
    camera_manager.rois[camera_id] = scaled_rois
    return jsonify(camera_manager.save_roi_config())

+
@app.route('/crop', methods=['POST'])
 def crop():
-    # Helper for UI
    data = request.json
+
    camera_id = data.get('camera_id')
    scaleX = data.get('scaleX', 1)
    scaleY = data.get('scaleY', 1)

    frame = camera_manager.get_frame(camera_id)
-    if frame is None: return jsonify({'error': 'No frame'}), 500
+    if frame is None:
+        return jsonify({'error': 'No frame'}), 500

    roi_list = camera_manager.rois.get(camera_id, [])
-    # Use the local UI helper function
    cropped_images = crop_image_for_ui(frame, roi_list, scaleX, scaleY)

    cropped_base64_list = []
@ -267,67 +414,81 @@ def crop():
        ret, buffer = cv2.imencode('.jpg', cropped_img)
        if ret:
            cropped_base64_list.append(base64.b64encode(buffer).decode('utf-8'))
+
    return jsonify({'cropped_images': cropped_base64_list})

+
@app.route('/detect_digits', methods=['POST'])
 def detect_digits():
-    """Manual trigger: Runs inference immediately and returns result."""
+    """Manual trigger: Runs inference immediately and returns result with validation."""
    data = request.json
-    camera_id = data.get('camera_id')

+    camera_id = data.get('camera_id')
    if not camera_id:
        return jsonify({'error': 'Invalid camera ID'}), 400

-    # 1. Get Frame
    frame = camera_manager.get_frame(camera_id)
    if frame is None:
        return jsonify({'error': 'Failed to capture image'}), 500

-    # 2. Get ROIs
    roi_list = camera_manager.rois.get(camera_id, [])
    if not roi_list:
        return jsonify({'error': 'No ROIs defined'}), 400

-    # 3. Crop (Using the UI helper is fine here)
    cropped_images = crop_image_for_ui(frame, roi_list, scaleX=1, scaleY=1)
    if not cropped_images:
        return jsonify({'error': 'Failed to crop ROIs'}), 500

-    # 4. Run Inference Synchronously
-    # Note: We access the worker directly. 
-    # Thread safety: 'predict_batch' uses 'self.interpreter'. 
-    # If the background thread is also using it, TFLite might complain or crash.
-    # PROPER FIX: Pause the worker or use a Lock.
-    
-    # Since adding a Lock is complex now, a simple hack is to just add it to the queue
-    # and WAIT for the result? No, that's hard to correlate.
-    
-    # SAFE APPROACH: Use a Lock in InferenceWorker.
-    # For now, let's assume TFLite is robust enough or race conditions are rare for manual clicks.
-    # CALL THE PUBLIC METHOD:
    try:
-        detected_digits = inference_worker.predict_batch(cropped_images)
+        predictions = inference_worker.predict_batch(cropped_images)

-        valid_digits = [d for d in detected_digits if d.isdigit()]
+        valid_digits_str = []
+        confidences = []
+        rejected_reasons = []

-        if not valid_digits:
-            return jsonify({'error': 'No valid digits detected', 'raw': detected_digits}), 500
+        CONFIDENCE_THRESHOLD = inference_worker.CONFIDENCE_THRESHOLD
+        MIN_VALUE = inference_worker.MIN_VALUE
+        MAX_VALUE = inference_worker.MAX_VALUE

-        final_number = int("".join(valid_digits))
+        for i, p in enumerate(predictions):
+            if p['confidence'] < CONFIDENCE_THRESHOLD:
+                msg = f"Digit {i} ('{p['digit']}') rejected: conf {p['confidence']:.2f} < {CONFIDENCE_THRESHOLD}"
+                rejected_reasons.append(msg)
+                if DEBUG_LOG:
+                    logger.warning("[Manual] %s", msg)
+            else:
+                valid_digits_str.append(p['digit'])
+                confidences.append(p['confidence'])

-        # Publish and Update State
-        publish_detected_number(camera_id, final_number)
-        camera_manager.results[camera_id] = final_number
+        if len(valid_digits_str) != len(predictions):
+            return jsonify({'error': 'Low confidence detection', 'details': rejected_reasons, 'raw': predictions}), 400

-        logger.info(f"Manual detection for {camera_id}: {final_number}")
+        final_number_str = "".join(valid_digits_str)
+        try:
+            final_number = int(final_number_str)

-        return jsonify({
-            'detected_digits': valid_digits, 
-            'final_number': final_number
-        })
+            if not (MIN_VALUE <= final_number <= MAX_VALUE):
+                msg = f"Value {final_number} out of range ({MIN_VALUE}-{MAX_VALUE})"
+                if DEBUG_LOG:
+                    logger.warning("[Manual] %s", msg)
+                return jsonify({'error': 'Value out of range', 'value': final_number}), 400
+
+            avg_conf = float(np.mean(confidences)) if confidences else None
+            publish_detected_number(camera_id, final_number, avg_conf)
+            camera_manager.results[camera_id] = final_number
+
+            return jsonify({
+                'detected_digits': valid_digits_str,
+                'final_number': final_number,
+                'confidences': confidences,
+                'avg_confidence': avg_conf,
+            })
+
+        except ValueError:
+            return jsonify({'error': 'Could not parse digits', 'raw': valid_digits_str}), 500

    except Exception as e:
-        logger.error(f"Error during manual detection: {e}")
+        logger.error("Error during manual detection: %s", e)
        return jsonify({'error': str(e)}), 500


@ -337,13 +498,8 @@ def update_camera_config():
    success = camera_manager.update_camera_flip(data.get("camera_id"), data.get("flip_type"))
    return jsonify({"success": success})

-# --- Main ---
-if __name__ == '__main__':
-    # Threading:
-    # 1. Video Threads (in Manager)
-    # 2. Inference Thread (in Worker)
-    # 3. Main Loop (process_all_cameras - handles feeding)

+if __name__ == '__main__':
    t = threading.Thread(target=process_all_cameras, daemon=True)
    t.start()

--- a/inference.py
+++ b/inference.py
@ -1,63 +1,115 @@
-import threading
-import queue
-import time
 import logging
+import queue
+import threading
+import time
+
 import cv2
 import numpy as np
 import tflite_runtime.interpreter as tflite
+
 from config import Config

+# ------------------------------------------------------------------------------
+# 1. USER CONFIGURATION (Edit these values here)
+# ------------------------------------------------------------------------------
+
+# Minimum confidence (0-1) to accept a digit. NOTE: the value set below (0.1) is far more permissive than either range suggested here.
+# - Higher (0.85-0.90) reduces false positives like "1010" from noise.
+# - Lower (0.70-0.75) helps with weak/dark digits.
+CONFIDENCE_THRESHOLD = 0.1
+
+# Minimum and Maximum expected values for the number.
+MIN_VALUE = 5
+MAX_VALUE = 100
+
+# ------------------------------------------------------------------------------
+
 logger = logging.getLogger(__name__)

+def _cfg(*names, default=None):
+    for n in names:
+        if hasattr(Config, n):
+            return getattr(Config, n)
+    return default
+
+
 class InferenceWorker:
-    def __init__(self):
+    def __init__(self, debug_log: bool = False):
+        self.debug_log = bool(debug_log)
+
        self.input_queue = queue.Queue(maxsize=10)
        self.result_queue = queue.Queue()
        self.running = False
+
        self.interpreter = None
        self.input_details = None
        self.output_details = None
-
        self.lock = threading.Lock()

-        # Load Model
+        # Debug counters / telemetry
+        self.task_seq = 0
+        self.dropped_tasks = 0
+        self.processed_tasks = 0
+        self.last_invoke_secs = None
+
+        # Set thresholds from top-level variables
+        self.CONFIDENCE_THRESHOLD = CONFIDENCE_THRESHOLD
+        self.MIN_VALUE = MIN_VALUE
+        self.MAX_VALUE = MAX_VALUE
+
        self.load_model()

    def load_model(self):
        try:
-            logger.info(f"Loading TFLite model from: {Config.MODEL_PATH}")
-            self.interpreter = tflite.Interpreter(model_path=Config.MODEL_PATH)
+            model_path = _cfg("MODEL_PATH", "MODELPATH", default=None)
+            logger.info("Loading TFLite model from: %s", model_path)
+
+            self.interpreter = tflite.Interpreter(model_path=model_path)
            self.interpreter.allocate_tensors()
+
            self.input_details = self.interpreter.get_input_details()
            self.output_details = self.interpreter.get_output_details()

-            # Store original input shape for resizing logic
            self.original_input_shape = self.input_details[0]['shape']
-            logger.info(f"Model loaded. Default input shape: {self.original_input_shape}")
+            if self.debug_log:
+                logger.info("Model loaded. Default input shape: %s", self.original_input_shape)

        except Exception as e:
-            logger.critical(f"Failed to load TFLite model: {e}")
+            logger.critical("Failed to load TFLite model: %s", e)
            self.interpreter = None

    def start(self):
-        if self.running: return
+        if self.running:
+            return
        self.running = True
        threading.Thread(target=self._worker_loop, daemon=True).start()
        logger.info("Inference worker started.")

-    def add_task(self, camera_id, rois, frame):
+    def add_task(self, camera_id, rois, frame, frame_std=None):
        """Add task (non-blocking)."""
-        if not self.interpreter: return
+        if not self.interpreter:
+            return
+
+        self.task_seq += 1
+        task = {
+            'camera_id': camera_id,
+            'rois': rois,
+            'frame': frame,
+            'timestamp': time.time(),
+            'task_id': self.task_seq,
+            'frame_std': frame_std,
+        }
+
        try:
-            task = {
-                'camera_id': camera_id,
-                'rois': rois,
-                'frame': frame,
-                'timestamp': time.time()
-            }
            self.input_queue.put(task, block=False)
        except queue.Full:
-            pass
+            self.dropped_tasks += 1
+            logger.warning(
+                "add_task drop cam=%s qsize=%d dropped=%d",
+                camera_id,
+                self.input_queue.qsize(),
+                self.dropped_tasks,
+            )

    def get_result(self):
        try:
@ -65,6 +117,12 @@ class InferenceWorker:
        except queue.Empty:
            return None

+    def _put_result(self, d):
+        try:
+            self.result_queue.put(d, block=False)
+        except Exception:
+            logger.exception("Failed to enqueue result")
+
    def _worker_loop(self):
        while self.running:
            try:
@ -75,35 +133,133 @@ class InferenceWorker:
            cam_id = task['camera_id']
            rois = task['rois']
            frame = task['frame']
+            task_id = task.get('task_id')
+            task_ts = task.get('timestamp')
+
+            if self.debug_log:
+                try:
+                    age_s = (time.time() - task_ts) if task_ts else None
+                    logger.info(
+                        "Worker got task cam=%s task_id=%s age_s=%s frame_std=%s rois=%d in_q=%d",
+                        cam_id,
+                        task_id,
+                        (f"{age_s:.3f}" if age_s is not None else "n/a"),
+                        task.get('frame_std'),
+                        len(rois) if rois else 0,
+                        self.input_queue.qsize(),
+                    )
+                except Exception:
+                    pass

            try:
-                # 1. Crop all ROIs
+                t0 = time.time()
                crops = self._crop_rois(frame, rois)
-                if not crops: continue
+                t_crop = time.time()

-                # 2. Batch Predict (Optimized Step)
-                digits = self.predict_batch(crops)
+                if not crops:
+                    self._put_result({
+                        'type': 'error',
+                        'camera_id': cam_id,
+                        'message': 'No ROIs cropped',
+                        'task_id': task_id,
+                        'task_ts': task_ts,
+                        'timing_s': {'crop': t_crop - t0, 'total': t_crop - t0},
+                    })
+                    continue

-                # 3. Combine
-                valid_digits = [d for d in digits if d.isdigit()]
-                if len(valid_digits) == len(digits) and len(valid_digits) > 0:
-                    final_number = int("".join(valid_digits))
+                predictions = self.predict_batch(crops)
+                t_pred = time.time()

-                    self.result_queue.put({
+                valid_digits_str = []
+                confidences = []
+                low_conf_details = []
+
+                for i, p in enumerate(predictions):
+                    if p['confidence'] < self.CONFIDENCE_THRESHOLD:
+                        low_conf_details.append(
+                            f"Digit {i} conf {p['confidence']:.2f} < {self.CONFIDENCE_THRESHOLD}"
+                        )
+                    valid_digits_str.append(p['digit'])
+                    confidences.append(p['confidence'])
+
+                if low_conf_details:
+                    self._put_result({
+                        'type': 'error',
+                        'camera_id': cam_id,
+                        'message': f"Low confidence: {', '.join(low_conf_details)}",
+                        'digits': valid_digits_str,
+                        'task_id': task_id,
+                        'task_ts': task_ts,
+                        'timing_s': {'crop': t_crop - t0, 'predict': t_pred - t_crop, 'total': t_pred - t0},
+                    })
+                    continue
+
+                if not valid_digits_str:
+                    self._put_result({
+                        'type': 'error',
+                        'camera_id': cam_id,
+                        'message': 'No digits produced',
+                        'task_id': task_id,
+                        'task_ts': task_ts,
+                        'timing_s': {'crop': t_crop - t0, 'predict': t_pred - t_crop, 'total': t_pred - t0},
+                    })
+                    continue
+
+                final_number_str = "".join(valid_digits_str)
+
+                try:
+                    final_number = int(final_number_str)
+                except ValueError:
+                    self._put_result({
+                        'type': 'error',
+                        'camera_id': cam_id,
+                        'message': f"Parse error: {valid_digits_str}",
+                        'task_id': task_id,
+                        'task_ts': task_ts,
+                        'timing_s': {'crop': t_crop - t0, 'predict': t_pred - t_crop, 'total': t_pred - t0},
+                    })
+                    continue
+
+                if self.MIN_VALUE <= final_number <= self.MAX_VALUE:
+                    avg_conf = float(np.mean(confidences)) if confidences else None
+                    self._put_result({
+                        'type': 'success',
                        'camera_id': cam_id,
                        'value': final_number,
-                        'digits': valid_digits
+                        'digits': valid_digits_str,
+                        'confidence': avg_conf,
+                        'task_id': task_id,
+                        'task_ts': task_ts,
+                        'timing_s': {'crop': t_crop - t0, 'predict': t_pred - t_crop, 'total': t_pred - t0},
+                    })
+                    self.processed_tasks += 1
+                else:
+                    self._put_result({
+                        'type': 'error',
+                        'camera_id': cam_id,
+                        'message': f"Value {final_number} out of range ({self.MIN_VALUE}-{self.MAX_VALUE})",
+                        'value': final_number,
+                        'task_id': task_id,
+                        'task_ts': task_ts,
+                        'timing_s': {'crop': t_crop - t0, 'predict': t_pred - t_crop, 'total': t_pred - t0},
                    })

-            except Exception as e:
-                logger.error(f"Inference error for {cam_id}: {e}")
+            except Exception:
+                logger.exception("Inference error cam=%s task_id=%s", cam_id, task_id)
+                self._put_result({
+                    'type': 'error',
+                    'camera_id': cam_id,
+                    'message': 'Exception during inference; see logs',
+                    'task_id': task_id,
+                    'task_ts': task_ts,
+                })

    def _crop_rois(self, image, roi_list):
        cropped_images = []
        for roi in roi_list:
            try:
                x, y, w, h = roi['x'], roi['y'], roi['width'], roi['height']
-                cropped = image[y:y+h, x:x+w]
+                cropped = image[y:y + h, x:x + w]
                if cropped.size > 0:
                    cropped_images.append(cropped)
            except Exception:
@ -111,55 +267,60 @@ class InferenceWorker:
        return cropped_images

    def predict_batch(self, images):
-        """Run inference on a batch of images at once."""
-        with self.lock:              # <--- Add this wrapper
-            if not self.interpreter: return []
+        """Run inference on a batch of images.
+
+        Returns list of dicts: {'digit': str, 'confidence': float}
+        """
+        with self.lock:
+            if not self.interpreter:
+                return []

            num_images = len(images)
-            if num_images == 0: return []
+            if num_images == 0:
+                return []

            input_index = self.input_details[0]['index']
            output_index = self.output_details[0]['index']

-            # Preprocess all images into a single batch array
-            # Shape: [N, 32, 20, 3] (assuming model expects 32x20 rgb)
            batch_input = []
-            
-            target_h, target_w = 32, 20  # Based on your previous code logic
+            target_h, target_w = 32, 20

            for img in images:
-                # Resize
                roi_resized = cv2.resize(img, (target_w, target_h))
-                # Color
                roi_rgb = cv2.cvtColor(roi_resized, cv2.COLOR_BGR2RGB)
-                # Normalize
                roi_norm = roi_rgb.astype(np.float32)
                batch_input.append(roi_norm)

-            # Create batch tensor
            input_tensor = np.array(batch_input)

-            # --- DYNAMIC RESIZING ---
-            # TFLite models have a fixed input size (usually batch=1).
-            # We must resize the input tensor to match our current batch size (N).
-            
-            # 1. Resize input tensor
+            # Keep current behavior (resize+allocate per batch). Debug timing is optional.
            self.interpreter.resize_tensor_input(input_index, [num_images, target_h, target_w, 3])
-            
-            # 2. Re-allocate tensors (This is expensive! See note below)
            self.interpreter.allocate_tensors()

-            # 3. Run Inference
            self.interpreter.set_tensor(input_index, input_tensor)
-            self.interpreter.invoke()

-            # 4. Get Results
+            t0 = time.time()
+            self.interpreter.invoke()
+            self.last_invoke_secs = time.time() - t0
+
+            if self.debug_log and self.last_invoke_secs and self.last_invoke_secs > 1.0:
+                logger.warning("Slow invoke: %.3fs (batch=%d)", self.last_invoke_secs, num_images)
+
            output_data = self.interpreter.get_tensor(output_index)

-            # Result shape is [N, 10] (probabilities for 10 digits)
-            predictions = []
+            results = []
            for i in range(num_images):
-                digit_class = np.argmax(output_data[i])
-                predictions.append(str(digit_class))
+                logits = output_data[i]

-            return predictions
+                # Numerically stable softmax
+                logits = logits - np.max(logits)
+                ex = np.exp(logits)
+                denom = np.sum(ex)
+                probs = (ex / denom) if denom != 0 else np.zeros_like(ex)
+
+                digit_class = int(np.argmax(probs))
+                confidence = float(probs[digit_class]) if probs.size else 0.0
+
+                results.append({'digit': str(digit_class), 'confidence': confidence})
+
+            return results
--- a/readme.md
+++ b/readme.md
@ -0,0 +1,63 @@
+# RTSPCamDigitDetection Backend
+
+This service reads frames from one or more RTSP cameras, crops user-defined ROIs (Regions of Interest) containing 7-segment digits, runs a TensorFlow Lite digit classifier, and publishes the assembled numeric value to MQTT (e.g., for Home Assistant).
+
+It also exposes a Flask web UI/API for live video previews, snapshots, and ROI configuration.
+
+## High-Level Architecture
+
+*   **`app.py` (Main Service):** Runs the Flask web server and the main processing loop. It drains results from the inference worker, handles MQTT publishing, and manages the per-camera rate-limiting logic.
+*   **`inference.py` (Worker):** A background thread that performs the heavy lifting. It accepts frames, crops the ROIs, runs the TFLite model, and validates results against confidence thresholds and numeric ranges.
+*   **`manager.py` & `camera.py`:** Handles the RTSP connections, frame buffering, and camera configuration management.
+
+## Configuration
+
+Configuration variables are defined directly at the top of the scripts for simplicity.
+
+### 1. Main Settings (`app.py`)
+Edit the top section of `app.py` to change these:
+
+*   **`DEBUG_LOG`** *(bool)*:
+    *   `True`: Enables verbose logging (heartbeats every 5s, per-task timing, detailed skip reasons).
+    *   `False`: Quiet mode. Only prints crucial info (MQTT publishes, connection errors). Warnings about skipped frames are rate-limited to once per minute to prevent log flooding.
+*   **`DETECTION_INTERVAL`** *(int)*:
+    *   How often (in seconds) to attempt a detection for each camera (Default: `10`).
+*   **`FRAME_STD_THRESHOLD`** *(float)*:
+    *   Standard Deviation threshold to filter out "bad" frames before inference.
+    *   Frames whose pixel standard deviation (a rough measure of contrast) is lower than this value are skipped.
+    *   *Recommendation:* Set to `0` (disables the check entirely) or `1` if your valid digits are low-contrast. Set higher (e.g., `25`) only if you need to filter out specific gray/green encoding artifacts.
+
+### 2. Inference Settings (`inference.py`)
+Edit the top section of `inference.py` to tune the digit classifier:
+
+*   **`CONFIDENCE_THRESHOLD`** *(0.0 - 1.0)*:
+    *   Minimum confidence required for a digit to be accepted.
+    *   *Recommendation:* `0.85` is a good balance to prevent false positives like "1010" while accepting valid digits.
+*   **`MIN_VALUE` / `MAX_VALUE`** *(int)*:
+    *   Sanity check range. Decoded numbers outside this range (e.g., `1010`) are discarded.
+
+## How It Works (Logic & Logging)
+
+### The "10s vs 60s" Behavior
+You might notice that successful detections are logged every **10 seconds**, but errors (like "Value out of range") appear only every **60 seconds**.
+*   **Success:** The app attempts detection every `DETECTION_INTERVAL` (10s). Every success is logged immediately as INFO.
+*   **Failure:** If the camera feed is bad or the value is out of range, the error technically occurs every 10s. However, when `DEBUG_LOG = False`, these repetitive warnings are suppressed and only printed **once per minute** to keep the CLI readable.
+
+### MQTT Behavior
+*   **Topic:** `homeassistant/sensor/RTSPCamDigitDetection/state/<camera_id>`
+*   **Payload:** `{"value": 42, "confidence": 0.98}`
+*   **Trigger:** Published only on **successful** detection and validation. Errors are not published to this topic to avoid messing up sensor history.
+
+## API Endpoints
+
+The app runs on port `5000` by default.
+
+| Method | Endpoint | Description |
+| :--- | :--- | :--- |
+| `GET` | `/` | Web UI Entry point. |
+| `GET` | `/video/<camera_id>` | MJPEG stream for live preview. |
+| `GET` | `/snapshot/<camera_id>` | Capture a single JPEG snapshot. |
+| `GET` | `/cameras` | List configured cameras. |
+| `GET` | `/rois/<camera_id>` | Get current ROI definitions. |
+| `POST` | `/save_rois` | Save new ROI definitions to disk. |
+| `POST` | `/detect_digits` | Manual trigger: runs inference immediately and returns full debug details (JSON). |
Author	SHA1	Message	Date
Bora	6efcad9cdf	5: readme	2026-01-01 11:39:26 +01:00
Bora	cfc74cc3f2	4: debugging flag	2026-01-01 11:28:57 +01:00
Bora	8d1b45ce73	3	2026-01-01 11:20:05 +01:00
Bora	78487918e4	2	2026-01-01 10:07:37 +01:00
Bora	5dae5b86c0	1	2026-01-01 09:53:11 +01:00