fix: correct CampaignsView, analysis.py IPv4 split, entities date filter

- CampaignsView: update ClusterData interface to match real API response
  (severity/unique_ips/score instead of threat_level/total_ips/confidence_range)
  Fix fetch to use data.items, rewrite ClusterCard and BehavioralTab
  Remove unused getClassificationColor and THREAT_ORDER constants
- analysis.py: fix IPv4Address object has no attribute 'split' on line 322
  Add str() conversion before calling .split('.')
- entities.py: fix Date vs DateTime comparison — log_date is a Date column,
  comparing against now() - INTERVAL X HOUR caused yesterday's entries to be excluded
  Use toDate(now() - INTERVAL X HOUR) for correct Date-level comparison

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
This commit is contained in:
SOC Analyst
2026-03-15 23:10:35 +01:00
parent 8d35b91642
commit 1455e04303
50 changed files with 5442 additions and 7325 deletions

View File

@@ -81,25 +81,94 @@ async def get_incident_clusters(
result = db.query(cluster_query, {"hours": hours, "limit": limit})
# Collect sample IPs to fetch real UA and trend data in bulk
sample_ips = [row[10] for row in result.result_rows if row[10]]
subnets_list = [row[0] for row in result.result_rows]
# Fetch real primary UA per sample IP from view_dashboard_entities
ua_by_ip: dict = {}
if sample_ips:
ip_list_sql = ", ".join(f"'{ip}'" for ip in sample_ips[:50])
ua_query = f"""
SELECT entity_value, arrayElement(user_agents, 1) AS top_ua
FROM view_dashboard_entities
WHERE entity_type = 'ip'
AND entity_value IN ({ip_list_sql})
AND notEmpty(user_agents)
GROUP BY entity_value, top_ua
ORDER BY entity_value
"""
try:
ua_result = db.query(ua_query)
for ua_row in ua_result.result_rows:
if ua_row[0] not in ua_by_ip and ua_row[1]:
ua_by_ip[str(ua_row[0])] = str(ua_row[1])
except Exception:
pass # UA enrichment is best-effort
# Compute real trend: compare current window vs previous window of same duration
trend_query = """
WITH cleaned AS (
SELECT
replaceRegexpAll(toString(src_ip), '^::ffff:', '') AS clean_ip,
detected_at,
concat(
splitByChar('.', clean_ip)[1], '.',
splitByChar('.', clean_ip)[2], '.',
splitByChar('.', clean_ip)[3], '.0/24'
) AS subnet
FROM ml_detected_anomalies
),
current_window AS (
SELECT subnet, count() AS cnt
FROM cleaned
WHERE detected_at >= now() - INTERVAL %(hours)s HOUR
GROUP BY subnet
),
prev_window AS (
SELECT subnet, count() AS cnt
FROM cleaned
WHERE detected_at >= now() - INTERVAL %(hours2)s HOUR
AND detected_at < now() - INTERVAL %(hours)s HOUR
GROUP BY subnet
)
SELECT c.subnet, c.cnt AS current_cnt, p.cnt AS prev_cnt
FROM current_window c
LEFT JOIN prev_window p ON c.subnet = p.subnet
"""
trend_by_subnet: dict = {}
try:
trend_result = db.query(trend_query, {"hours": hours, "hours2": hours * 2})
for tr in trend_result.result_rows:
subnet_key = tr[0]
curr = tr[1] or 0
prev = tr[2] or 0
if prev == 0:
trend_by_subnet[subnet_key] = ("new", 100)
else:
pct = round(((curr - prev) / prev) * 100)
trend_by_subnet[subnet_key] = ("up" if pct >= 0 else "down", abs(pct))
except Exception:
pass
clusters = []
for row in result.result_rows:
# Calcul du score de risque
subnet = row[0]
threat_level = row[8] or 'LOW'
unique_ips = row[2] or 1
avg_score = abs(row[9] or 0)
# Score based on threat level and other factors
sample_ip = row[10] if row[10] else subnet.split('/')[0]
critical_count = 1 if threat_level == 'CRITICAL' else 0
high_count = 1 if threat_level == 'HIGH' else 0
risk_score = min(100, round(
(critical_count * 30) +
(high_count * 20) +
(unique_ips * 5) +
(critical_count * 30) +
(high_count * 20) +
(unique_ips * 5) +
(avg_score * 100)
))
# Détermination de la sévérité
if critical_count > 0 or risk_score >= 80:
severity = "CRITICAL"
elif high_count > (row[1] or 1) * 0.3 or risk_score >= 60:
@@ -108,31 +177,27 @@ async def get_incident_clusters(
severity = "MEDIUM"
else:
severity = "LOW"
# Calcul de la tendance
trend = "up"
trend_percentage = 23
trend_dir, trend_pct = trend_by_subnet.get(subnet, ("stable", 0))
primary_ua = ua_by_ip.get(sample_ip, "")
clusters.append({
"id": f"INC-{datetime.now().strftime('%Y%m%d')}-{len(clusters)+1:03d}",
"score": risk_score,
"severity": severity,
"total_detections": row[1],
"unique_ips": row[2],
"subnet": row[0],
"sample_ip": row[10] if row[10] else row[0].split('/')[0],
"subnet": subnet,
"sample_ip": sample_ip,
"ja4": row[5] or "",
"primary_ua": "python-requests",
"primary_target": "Unknown",
"countries": [{
"code": row[6] or "XX",
"percentage": 100
}],
"primary_ua": primary_ua,
"primary_target": row[3].strftime('%H:%M') if row[3] else "Unknown",
"countries": [{"code": row[6] or "XX", "percentage": 100}],
"asn": str(row[7]) if row[7] else "",
"first_seen": row[3].isoformat() if row[3] else "",
"last_seen": row[4].isoformat() if row[4] else "",
"trend": trend,
"trend_percentage": trend_percentage
"trend": trend_dir,
"trend_percentage": trend_pct,
})
return {