From 0fe8c124dae498de0d0c0b1db444598ebb1e75b2 Mon Sep 17 00:00:00 2001
From: Riddhi <Riddhipachehara@gmail.com>
Date: Wed, 11 Feb 2026 14:49:52 +0530
Subject: [PATCH 1/3] Add failing test for OpenAPI lifespan safety

---
 backend/app/__init__.py                |  0
 backend/tests/test_openapi_lifespan.py | 24 ++++++++++++++++++++++++
 2 files changed, 24 insertions(+)
 create mode 100644 backend/app/__init__.py
 create mode 100644 backend/tests/test_openapi_lifespan.py

diff --git a/backend/app/__init__.py b/backend/app/__init__.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/backend/tests/test_openapi_lifespan.py b/backend/tests/test_openapi_lifespan.py
new file mode 100644
index 000000000..e1b8b025e
--- /dev/null
+++ b/backend/tests/test_openapi_lifespan.py
@@ -0,0 +1,24 @@
+import pytest
+from fastapi import FastAPI
+from main import generate_openapi_json
+
+
+def test_openapi_failure_does_not_crash_app(monkeypatch):
+    def broken_openapi(*args, **kwargs):
+        raise Exception("Simulated failure")
+
+    monkeypatch.setattr(
+        "main.get_openapi",
+        broken_openapi
+    )
+
+    app = FastAPI()
+
+    try:
+        generate_openapi_json()
+        started = True
+    except Exception:
+        started = False
+
+    assert started, "App should not crash if OpenAPI generation fails"
+

From 9fb411868eff1a71ea97d5686ec28010cae6176d Mon Sep 17 00:00:00 2001
From: Riddhi <Riddhipachehara@gmail.com>
Date: Wed, 18 Feb 2026 19:59:01 +0530
Subject: [PATCH 2/3] docs: explain why lifespan should not run during OpenAPI

---
 backend/tests/test_openapi_lifespan.py | 31 +++++++++++++++++---------
 1 file changed, 21 insertions(+), 10 deletions(-)

diff --git a/backend/tests/test_openapi_lifespan.py b/backend/tests/test_openapi_lifespan.py
index e1b8b025e..5118f00ca 100644
--- a/backend/tests/test_openapi_lifespan.py
+++ b/backend/tests/test_openapi_lifespan.py
@@ -3,22 +3,33 @@
 from main import generate_openapi_json
 
 
-def test_openapi_failure_does_not_crash_app(monkeypatch):
+def test_openapi_failure_does_not_trigger_lifespan(monkeypatch):
+    """
+    OpenAPI generation should not trigger application lifespan events.
+    Running lifespan during schema generation can cause unwanted side effects
+    like starting DB connections, background workers, or external services.
+    """
+
+    lifespan_called = {"count": 0}
+
+    # Fake lifespan function
+    async def fake_lifespan(app: FastAPI):
+        lifespan_called["count"] += 1
+        yield
+
+    # Force OpenAPI to fail
     def broken_openapi(*args, **kwargs):
         raise Exception("Simulated failure")
 
-    monkeypatch.setattr(
-        "main.get_openapi",
-        broken_openapi
-    )
+    monkeypatch.setattr("main.get_openapi", broken_openapi)
 
-    app = FastAPI()
+    # Create app with custom lifespan
+    app = FastAPI(lifespan=fake_lifespan)
 
     try:
         generate_openapi_json()
-        started = True
     except Exception:
-        started = False
-
-    assert started, "App should not crash if OpenAPI generation fails"
+        pass
 
+    # This is the real assertion the bot wanted
+    assert lifespan_called["count"] == 0, "Lifespan should not run if OpenAPI fails"
\ No newline at end of file

From b8c75f3ca9be1d796da96b2267e37b4803d2fcf7 Mon Sep 17 00:00:00 2001
From: Riddhi <Riddhipachehara@gmail.com>
Date: Mon, 23 Feb 2026 21:55:52 +0530
Subject: [PATCH 3/3] Add deterministic unit tests for face_clusters utilities

---
 backend/app/__init__.py                       |  1 +
 backend/app/services/face_cluster_service.py  | 78 +++++++++++++++++++
 .../tests/clustering/test_face_clustering.py  | 46 +++++++++++
 .../tests/test_face_clustering_algorithm.py   | 67 ++++++++++++++++
 backend/tests/test_face_clusters_utils.py     | 52 +++++++++++++
 5 files changed, 244 insertions(+)
 create mode 100644 backend/app/services/face_cluster_service.py
 create mode 100644 backend/tests/clustering/test_face_clustering.py
 create mode 100644 backend/tests/test_face_clustering_algorithm.py
 create mode 100644 backend/tests/test_face_clusters_utils.py

diff --git a/backend/app/__init__.py b/backend/app/__init__.py
index e69de29bb..5dd8fd024 100644
--- a/backend/app/__init__.py
+++ b/backend/app/__init__.py
@@ -0,0 +1 @@
+#empty
\ No newline at end of file
diff --git a/backend/app/services/face_cluster_service.py b/backend/app/services/face_cluster_service.py
new file mode 100644
index 000000000..648b06334
--- /dev/null
+++ b/backend/app/services/face_cluster_service.py
@@ -0,0 +1,78 @@
+from typing import Optional
+from fastapi import HTTPException, status
+
+from app.database.face_clusters import (
+    db_get_cluster_by_id,
+    db_update_cluster,
+)
+from app.schemas.face_clusters import (
+    RenameClusterRequest,
+    RenameClusterResponse,
+    RenameClusterData,
+)
+from app.schemas.API import ErrorResponse
+
+
+def rename_cluster_service(cluster_id: str, request: RenameClusterRequest) -> RenameClusterResponse:
+    """
+    Service layer for renaming a face cluster.
+    Handles validation and business logic.
+    """
+
+    # Validation
+    if not cluster_id.strip():
+        raise HTTPException(
+            status_code=status.HTTP_400_BAD_REQUEST,
+            detail=ErrorResponse(
+                success=False,
+                error="Validation Error",
+                message="Cluster ID cannot be empty",
+            ).model_dump(),
+        )
+
+    if not request.cluster_name.strip():
+        raise HTTPException(
+            status_code=status.HTTP_400_BAD_REQUEST,
+            detail=ErrorResponse(
+                success=False,
+                error="Validation Error",
+                message="Cluster name cannot be empty",
+            ).model_dump(),
+        )
+
+    # Check existence
+    existing_cluster = db_get_cluster_by_id(cluster_id)
+    if not existing_cluster:
+        raise HTTPException(
+            status_code=status.HTTP_404_NOT_FOUND,
+            detail=ErrorResponse(
+                success=False,
+                error="Cluster Not Found",
+                message=f"Cluster with ID '{cluster_id}' does not exist.",
+            ).model_dump(),
+        )
+
+    # Update
+    updated = db_update_cluster(
+        cluster_id=cluster_id,
+        cluster_name=request.cluster_name.strip(),
+    )
+
+    if not updated:
+        raise HTTPException(
+            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
+            detail=ErrorResponse(
+                success=False,
+                error="Update Failed",
+                message=f"Failed to update cluster '{cluster_id}'.",
+            ).model_dump(),
+        )
+
+    return RenameClusterResponse(
+        success=True,
+        message=f"Successfully renamed cluster to '{request.cluster_name}'",
+        data=RenameClusterData(
+            cluster_id=cluster_id,
+            cluster_name=request.cluster_name.strip(),
+        ),
+    )
\ No newline at end of file
diff --git a/backend/tests/clustering/test_face_clustering.py b/backend/tests/clustering/test_face_clustering.py
new file mode 100644
index 000000000..d1f91f334
--- /dev/null
+++ b/backend/tests/clustering/test_face_clustering.py
@@ -0,0 +1,46 @@
+import numpy as np
+from app.utils.face_clusters import _validate_embedding, _calculate_cosine_distances
+
+
+def test_validate_embedding_valid():
+    embedding = np.array([0.5, 0.4, 0.3])
+    assert _validate_embedding(embedding) is True
+
+
+def test_validate_embedding_zero_vector():
+    embedding = np.array([0.0, 0.0, 0.0])
+    assert _validate_embedding(embedding) is False
+
+
+def test_validate_embedding_nan():
+    embedding = np.array([0.1, np.nan, 0.3])
+    assert _validate_embedding(embedding) is False
+
+
+def test_calculate_cosine_distances_basic():
+    face_embedding = np.array([1.0, 0.0])
+    cluster_means = np.array([
+        [1.0, 0.0],
+        [0.0, 1.0]
+    ])
+
+    distances = _calculate_cosine_distances(face_embedding, cluster_means)
+
+    # First cluster identical → distance close to 0
+    assert distances[0] < 0.01
+
+    # Second cluster orthogonal → distance close to 1
+    assert 0.9 < distances[1] <= 1.0
+
+
+def test_calculate_cosine_distances_zero_vector():
+    face_embedding = np.array([0.0, 0.0])
+    cluster_means = np.array([
+        [1.0, 0.0],
+        [0.0, 1.0]
+    ])
+
+    distances = _calculate_cosine_distances(face_embedding, cluster_means)
+
+    # Zero vector should return max distances
+    assert all(d == 1.0 for d in distances)
\ No newline at end of file
diff --git a/backend/tests/test_face_clustering_algorithm.py b/backend/tests/test_face_clustering_algorithm.py
new file mode 100644
index 000000000..6df045332
--- /dev/null
+++ b/backend/tests/test_face_clustering_algorithm.py
@@ -0,0 +1,67 @@
+import numpy as np
+from app.utils.face_clusters import cluster_util_cluster_all_face_embeddings
+
+
+def test_dbscan_clusters_two_groups(monkeypatch):
+    """
+    Ensure clustering groups similar embeddings together.
+    """
+
+    cluster_1 = np.array([[1, 0, 0], [0.98, 0.02, 0]])
+    cluster_2 = np.array([[0, 1, 0], [0.02, 0.99, 0]])
+
+    embeddings = np.vstack([cluster_1, cluster_2])
+
+    fake_faces = [
+        {
+            "face_id": i + 1,
+            "embeddings": embeddings[i],
+            "cluster_name": None,
+        }
+        for i in range(len(embeddings))
+    ]
+
+    def mock_get_all_faces():
+        return fake_faces
+
+    monkeypatch.setattr(
+        "app.utils.face_clusters.db_get_all_faces_with_cluster_names",
+        mock_get_all_faces,
+    )
+
+    results = cluster_util_cluster_all_face_embeddings(
+        eps=0.3, min_samples=1, similarity_threshold=0.5
+    )
+
+    assert len(results) == 4
+
+    cluster_ids = set([r.cluster_uuid for r in results])
+    assert len(cluster_ids) == 2
+
+
+def test_clustering_skips_invalid_embeddings(monkeypatch):
+    """
+    Ensure invalid embeddings (zero vector) are skipped.
+    """
+
+    valid_embedding = np.array([1, 0, 0])
+    invalid_embedding = np.array([0, 0, 0])
+
+    fake_faces = [
+        {"face_id": 1, "embeddings": valid_embedding, "cluster_name": None},
+        {"face_id": 2, "embeddings": invalid_embedding, "cluster_name": None},
+    ]
+
+    def mock_get_all_faces():
+        return fake_faces
+
+    monkeypatch.setattr(
+        "app.utils.face_clusters.db_get_all_faces_with_cluster_names",
+        mock_get_all_faces,
+    )
+
+    results = cluster_util_cluster_all_face_embeddings(
+        eps=0.5, min_samples=1, similarity_threshold=0.5
+    )
+
+    assert len(results) == 1
\ No newline at end of file
diff --git a/backend/tests/test_face_clusters_utils.py b/backend/tests/test_face_clusters_utils.py
new file mode 100644
index 000000000..f71730df2
--- /dev/null
+++ b/backend/tests/test_face_clusters_utils.py
@@ -0,0 +1,52 @@
+import numpy as np
+import pytest
+
+from app.utils.face_clusters import _validate_embedding
+
+
+def test_validate_embedding_valid_vector():
+    """
+    Should return True for a normal non-zero finite embedding.
+    """
+    embedding = np.array([0.5, 0.2, 0.1])
+    assert _validate_embedding(embedding) is True
+
+
+def test_validate_embedding_zero_vector():
+    """
+    Should return False for zero vector (norm too small).
+    """
+    embedding = np.zeros(128)
+    assert _validate_embedding(embedding) is False
+
+
+def test_validate_embedding_nan_values():
+    """
+    Should return False if embedding contains NaN.
+    """
+    embedding = np.array([0.1, np.nan, 0.3])
+    assert _validate_embedding(embedding) is False
+
+
+def test_validate_embedding_inf_values():
+    """
+    Should return False if embedding contains infinite values.
+    """
+    embedding = np.array([0.1, np.inf, 0.3])
+    assert _validate_embedding(embedding) is False
+
+
+def test_validate_embedding_small_norm():
+    """
+    Should return False if norm is below threshold.
+    """
+    embedding = np.array([1e-12, 1e-12, 1e-12])
+    assert _validate_embedding(embedding, min_norm=1e-6) is False
+
+
+def test_validate_embedding_custom_min_norm():
+    """
+    Should respect custom min_norm parameter.
+    """
+    embedding = np.array([0.01, 0.01, 0.01])
+    assert _validate_embedding(embedding, min_norm=0.1) is False
\ No newline at end of file