127 lines
5.5 KiB
SQL
127 lines
5.5 KiB
SQL
-- ============================================================================
|
|
-- PROJET : Moteur de Détection de Menaces HTTP
|
|
-- DESCRIPTION : Reconfiguration des vues d'agrégation, nouveauté et scoring.
|
|
-- DATE : 2026-03-08
|
|
-- ============================================================================
|
|
|
|
-- ----------------------------------------------------------------------------
|
|
-- 1. NETTOYAGE DES OBJETS EXISTANTS (Ordre inverse des dépendances)
|
|
-- ----------------------------------------------------------------------------
|
|
DROP VIEW IF EXISTS mabase_prod.live_threat_scores;
|
|
DROP VIEW IF EXISTS mabase_prod.mv_baseline_update;
|
|
DROP VIEW IF EXISTS mabase_prod.mv_novelty;
|
|
DROP VIEW IF EXISTS mabase_prod.mv_traffic_1d;
|
|
DROP VIEW IF EXISTS mabase_prod.mv_traffic_1h;
|
|
DROP VIEW IF EXISTS mabase_prod.mv_traffic_1m;
|
|
|
|
-- ----------------------------------------------------------------------------
|
|
-- 2. RECONSTRUCTION DE LA CHAÎNE DE ROLLUP (Aggrégations temporelles)
|
|
-- ----------------------------------------------------------------------------
|
|
|
|
-- MV 1 Minute : Transformation des logs bruts en métriques techniques
|
|
CREATE MATERIALIZED VIEW mabase_prod.mv_traffic_1m
|
|
TO mabase_prod.agg_traffic_1m
|
|
AS SELECT
|
|
toStartOfMinute(time) AS minute,
|
|
host, src_ip, src_asn, src_country_code, ja4, ja3_hash, header_user_agent,
|
|
countState() AS hits,
|
|
uniqState(path) AS uniq_paths,
|
|
avgState(syn_to_clienthello_ms) AS avg_syn_to_clienthello_ms,
|
|
varPopState(syn_to_clienthello_ms) AS var_syn_to_clienthello_ms,
|
|
avgState(toFloat64((length(client_headers) - length(replaceAll(client_headers, ',', ''))) + 1)) AS avg_headers_count,
|
|
countIfState((header_user_agent ILIKE '%Chrome%') AND (ja4 NOT ILIKE 't13d%')) AS spoofing_ua_tls,
|
|
countIfState((header_user_agent ILIKE '%Chrome%') AND (tls_alpn NOT ILIKE '%h2%')) AS spoofing_ua_alpn,
|
|
countIfState((header_user_agent ILIKE '%Windows%') AND (ip_meta_ttl <= 64)) AS spoofing_os_ttl,
|
|
countIfState((header_accept_language = '') OR (header_sec_ch_ua = '')) AS missing_human_headers,
|
|
countIfState(method IN ('PUT', 'DELETE', 'OPTIONS', 'TRACE')) AS suspicious_methods,
|
|
countIfState((length(query) > 200) OR match(query, '(%[0-9A-Fa-f]{2}){5,}')) AS suspicious_queries
|
|
FROM mabase_prod.http_logs
|
|
GROUP BY minute, host, src_ip, src_asn, src_country_code, ja4, ja3_hash, header_user_agent;
|
|
|
|
-- MV 1 Heure : Agrégation secondaire (Cascading)
|
|
CREATE MATERIALIZED VIEW mabase_prod.mv_traffic_1h
|
|
TO mabase_prod.agg_traffic_1h
|
|
AS SELECT
|
|
toStartOfHour(minute) AS hour,
|
|
host, src_country_code, ja4, ja3_hash, header_user_agent,
|
|
countMergeState(hits) AS hits,
|
|
uniqMergeState(uniq_paths) AS uniq_paths,
|
|
countIfMergeState(missing_human_headers) AS missing_human_headers,
|
|
uniqState(src_ip) AS uniq_ips
|
|
FROM mabase_prod.agg_traffic_1m
|
|
GROUP BY hour, host, src_country_code, ja4, ja3_hash, header_user_agent;
|
|
|
|
-- MV 1 Jour : Agrégation tertiaire pour archivage et baseline
|
|
CREATE MATERIALIZED VIEW mabase_prod.mv_traffic_1d
|
|
TO mabase_prod.agg_traffic_1d
|
|
AS SELECT
|
|
toDate(hour) AS day,
|
|
host, src_country_code, ja4, ja3_hash, header_user_agent,
|
|
countMergeState(hits) AS hits,
|
|
uniqMergeState(uniq_ips) AS uniq_ips,
|
|
uniqMergeState(uniq_paths) AS uniq_paths,
|
|
countIfMergeState(missing_human_headers) AS missing_human_headers
|
|
FROM mabase_prod.agg_traffic_1h
|
|
GROUP BY day, host, src_country_code, ja4, ja3_hash, header_user_agent;
|
|
|
|
-- ----------------------------------------------------------------------------
|
|
-- 3. RECONSTRUCTION DES BRIQUES D'INTELLIGENCE (Novelty & Baseline)
|
|
-- ----------------------------------------------------------------------------
|
|
|
|
-- MV Novelty : Détection de nouvelles empreintes (HTTP + TLS)
|
|
CREATE MATERIALIZED VIEW mabase_prod.mv_novelty
|
|
TO mabase_prod.agg_novelty
|
|
AS SELECT
|
|
host,
|
|
ja4,
|
|
cityHash64(client_headers) AS http_fp,
|
|
minState(time) AS first_seen,
|
|
maxState(time) AS last_seen,
|
|
countState() AS total_hits
|
|
FROM mabase_prod.http_logs
|
|
GROUP BY host, ja4, http_fp;
|
|
|
|
-- MV Baseline : Calcul statistique du trafic normal par JA4
|
|
CREATE MATERIALIZED VIEW mabase_prod.mv_baseline_update
|
|
TO mabase_prod.tbl_baseline_ja4_7d
|
|
AS SELECT
|
|
ja4,
|
|
quantile(0.99)(hourly_hits) AS p99_hits_per_hour,
|
|
avg(hourly_hits) AS avg_hits_per_hour,
|
|
now() AS last_update
|
|
FROM (
|
|
SELECT
|
|
ja4,
|
|
toStartOfHour(minute) as hour,
|
|
countMerge(hits) AS hourly_hits
|
|
FROM mabase_prod.agg_traffic_1m
|
|
WHERE minute >= now() - INTERVAL 7 DAY
|
|
GROUP BY ja4, hour
|
|
)
|
|
GROUP BY ja4;
|
|
|
|
-- ----------------------------------------------------------------------------
|
|
-- 4. VUE DE SCORING FINAL (Verdict Temps Réel)
|
|
-- ----------------------------------------------------------------------------
|
|
|
|
CREATE VIEW mabase_prod.live_threat_scores AS
|
|
SELECT
|
|
T1.src_ip,
|
|
T1.ja4,
|
|
T1.src_asn,
|
|
T1.src_country_code,
|
|
(
|
|
if(countMerge(T1.spoofing_ua_tls) > 0, 40, 0) +
|
|
if(countMerge(T1.spoofing_os_ttl) > 0, 40, 0) +
|
|
if(varPopMerge(T1.var_syn_to_clienthello_ms) < 1.0, 20, 0) +
|
|
if(dateDiff('hour', minMerge(N.first_seen), now()) < 2, 30, 0) +
|
|
if(countMerge(T1.hits) > coalesce(B.p99_hits_per_hour * 3, 1000), 50, 0)
|
|
) AS final_score,
|
|
countMerge(T1.hits) AS current_hits,
|
|
B.p99_hits_per_hour AS historical_baseline
|
|
FROM mabase_prod.agg_traffic_1m AS T1
|
|
LEFT JOIN mabase_prod.agg_novelty AS N ON T1.ja4 = N.ja4 AND T1.host = N.host
|
|
LEFT JOIN mabase_prod.tbl_baseline_ja4_7d AS B ON T1.ja4 = B.ja4
|
|
WHERE T1.minute >= now() - INTERVAL 5 MINUTE
|
|
GROUP BY T1.src_ip, T1.ja4, T1.src_asn, T1.src_country_code, B.p99_hits_per_hour;
|