Initial commit: logcorrelator with unified packaging (DEB + RPM using fpm)

Co-authored-by: Qwen-Coder <qwen-coder@alibabacloud.com>
2026-02-27 15:31:46 +01:00
commit 8fc14c1e94
35 changed files with 4829 additions and 0 deletions
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@ -0,0 +1,73 @@
 # CI workflow: runs the Go tests, then builds the binary and the Docker image.
 name: Build and Test
 # Runs on pushes to main and on pull requests that target main.
 on:
  push:
    branches: [ main ]
  pull_request:
    branches: [ main ]
 jobs:
  test:
    # Runs the test suite with the race detector and fails the job when the
    # total statement coverage is below 80%.
    runs-on: ubuntu-latest
    steps:
      - uses: actions/checkout@v4
      - name: Set up Go
        uses: actions/setup-go@v5
        with:
          go-version: '1.21'
      - name: Download dependencies
        run: go mod download
      - name: Run tests with coverage
        run: |
          go test -race -coverprofile=coverage.txt -covermode=atomic ./...
          # Read only the summary row (first field is exactly "total:") so that
          # functions or paths containing the word "total" cannot pollute it.
          TOTAL=$(go tool cover -func=coverage.txt | awk '$1 == "total:" {gsub(/%/, "", $3); print $3}')
          if [ -z "$TOTAL" ]; then
            echo "Could not determine total coverage from coverage.txt"
            exit 1
          fi
          echo "Coverage: ${TOTAL}%"
          if (( $(echo "$TOTAL < 80" | bc -l) )); then
            echo "Coverage ${TOTAL}% is below 80% threshold"
            exit 1
          fi
      - name: Upload coverage to Codecov
        uses: codecov/codecov-action@v3
        with:
          file: ./coverage.txt
  build:
    # Compiles the linux/amd64 binary with cgo disabled once the test job has
    # succeeded, then publishes it as a workflow artifact.
    needs: test
    runs-on: ubuntu-latest
    steps:
      - uses: actions/checkout@v4
      - name: Set up Go
        uses: actions/setup-go@v5
        with:
          go-version: '1.21'
      - name: Build binary
        env:
          CGO_ENABLED: '0'
          GOOS: linux
          GOARCH: amd64
        run: go build -ldflags="-w -s" -o logcorrelator ./cmd/logcorrelator
      - name: Upload binary artifact
        uses: actions/upload-artifact@v4
        with:
          path: logcorrelator
          name: logcorrelator-linux-amd64
  docker:
    # Builds the runtime container image and smoke-tests its entrypoint.
    runs-on: ubuntu-latest
    needs: test
    steps:
      - uses: actions/checkout@v4
      - name: Build Docker image
        # Without --target, docker builds the last stage of the Dockerfile
        # (the "dev" stage) instead of the image that ships the service.
        run: docker build --target runtime -t logcorrelator:latest .
      - name: Run tests in Docker
        # Best-effort smoke test: the exit status of --help is deliberately
        # ignored, so this step only proves the image can be started.
        run: |
          docker run --rm logcorrelator:latest --help || true
--- a/.gitignore
+++ b/.gitignore
@ -0,0 +1,31 @@
 # Build directory
 /build/
 /dist/
 # Binaries
 *.exe
 *.exe~
 *.dll
 *.so
 *.dylib
 logcorrelator
 # Test binary
 *.test
 # Output of the go coverage tool
 # (coverage.txt is the profile name used by the CI workflow and the Dockerfile)
 *.out
 coverage.txt
 # Dependency directories
 vendor/
 # IDE
 .idea/
 .vscode/
 *.swp
 *.swo
 *~
 # OS
 .DS_Store
 Thumbs.db
--- a/150
+++ b/150
@ -0,0 +1,150 @@
 # syntax=docker/dockerfile:1
 # =============================================================================
 # Builder stage - compile and test
 # =============================================================================
 FROM golang:1.21 AS builder
 WORKDIR /build
 # Install dependencies
 RUN apt-get update && apt-get install -y --no-install-recommends \
    git \
    bc \
    && rm -rf /var/lib/apt/lists/*
 # Copy the module manifests before the sources so the dependency layer is
 # reused until they change. The go.sum* glob tolerates a missing go.sum.
 COPY go.mod go.sum* ./
 # Download dependencies; a failure stops the build here instead of surfacing
 # later as a less obvious error in the test or build step.
 RUN go mod download
 # Copy source code
 COPY . .
 # Run tests with coverage (fail if < 80%).
 # RUN executes through /bin/sh, so the threshold check uses POSIX "[ ... ]"
 # rather than the bash-only "(( ... ))" form. The test is written as
 # "pass only when bc confirms TOTAL >= 80", so an empty or unparsable TOTAL
 # also fails the build.
 RUN --mount=type=cache,target=/root/.cache/go-build \
    go test -race -coverprofile=coverage.txt -covermode=atomic ./... && \
    echo "=== Coverage Report ===" && \
    go tool cover -func=coverage.txt | grep total && \
    TOTAL=$(go tool cover -func=coverage.txt | awk '$1 == "total:" {gsub(/%/, "", $3); print $3}') && \
    echo "Total coverage: ${TOTAL}%" && \
    if [ "$(echo "$TOTAL >= 80" | bc -l)" != "1" ]; then \
        echo "ERROR: Coverage ${TOTAL}% is below 80% threshold"; \
        exit 1; \
    fi && \
    echo "Coverage check passed!"
 # Build binary
 RUN --mount=type=cache,target=/root/.cache/go-build \
    CGO_ENABLED=0 GOOS=linux GOARCH=amd64 go build \
    -ldflags="-w -s" \
    -o /usr/bin/logcorrelator \
    ./cmd/logcorrelator
 # Create runtime root filesystem
 RUN mkdir -p /tmp/runtime-root/var/log/logcorrelator /tmp/runtime-root/var/run/logcorrelator /tmp/runtime-root/etc/logcorrelator
 # =============================================================================
 # Runtime stage - minimal image for running the service
 # =============================================================================
 FROM gcr.io/distroless/base-debian12 AS runtime
 # Copy binary from builder
 COPY --from=builder /usr/bin/logcorrelator /usr/bin/logcorrelator
 # Copy example config
 COPY --from=builder /build/config.example.conf /etc/logcorrelator/logcorrelator.conf
 # Create necessary directories in builder stage (distroless has no shell)
 COPY --from=builder /tmp/runtime-root/var /var
 COPY --from=builder /tmp/runtime-root/etc /etc
 # Expose nothing (Unix sockets only)
 # Health check not applicable for this service type
 # Set entrypoint
 ENTRYPOINT ["/usr/bin/logcorrelator"]
 CMD ["-config", "/etc/logcorrelator/logcorrelator.conf"]
 # =============================================================================
 # RPM build stage - create .rpm package entirely in Docker
 # =============================================================================
 FROM ruby:3.2-bookworm AS rpm-builder
 WORKDIR /build
 # Install fpm and rpm tools
 RUN apt-get update && apt-get install -y --no-install-recommends \
    rpm \
    && rm -rf /var/lib/apt/lists/* \
    && gem install fpm -v 1.16.0
 # Copy binary from builder stage
 COPY --from=builder /usr/bin/logcorrelator /tmp/pkgroot/usr/bin/logcorrelator
 # Copy config and systemd unit
 COPY --from=builder /build/config.example.conf /tmp/pkgroot/etc/logcorrelator/logcorrelator.conf
 COPY logcorrelator.service /tmp/pkgroot/etc/systemd/system/logcorrelator.service
 # Create directory structure and set permissions
 RUN mkdir -p /tmp/pkgroot/var/log/logcorrelator && \
    mkdir -p /tmp/pkgroot/var/run/logcorrelator && \
    chmod 755 /tmp/pkgroot/var/log/logcorrelator && \
    chmod 755 /tmp/pkgroot/var/run/logcorrelator
 # Build RPM
 ARG VERSION=1.0.0
 RUN fpm -s dir -t rpm \
    -n logcorrelator \
    -v ${VERSION} \
    -C /tmp/pkgroot \
    --prefix / \
    --description "Log correlation service for HTTP and network events" \
    --url "https://github.com/logcorrelator/logcorrelator" \
    --license "MIT" \
    --vendor "logcorrelator" \
    -p /tmp/logcorrelator-${VERSION}.rpm \
    usr/bin/logcorrelator \
    etc/logcorrelator/logcorrelator.conf \
    etc/systemd/system/logcorrelator.service \
    var/log/logcorrelator \
    var/run/logcorrelator
 # =============================================================================
 # Test stage - verify RPM on Rocky Linux
 # =============================================================================
 FROM rockylinux:8 AS rpm-test
 # Install systemd (for testing service unit)
 RUN dnf install -y systemd && \
    dnf clean all
 # Copy RPM from rpm-builder
 COPY --from=rpm-builder /tmp/logcorrelator-*.rpm /tmp/
 # Install the RPM
 RUN rpm -ivh /tmp/logcorrelator-*.rpm || true
 # Verify installation
 RUN ls -la /usr/bin/logcorrelator && \
    ls -la /etc/logcorrelator/ && \
    ls -la /etc/systemd/system/logcorrelator.service
 # =============================================================================
 # Development stage - for local testing with hot reload
 # =============================================================================
 # Development image: full Go toolchain plus the sources, started with
 # "go run". It is the last stage shown in this Dockerfile, so a plain
 # "docker build ." without --target is expected to produce this image.
 FROM golang:1.21 AS dev
 WORKDIR /app
 # Install air for hot reload (optional)
 # NOTE(review): "@latest" is unpinned, so the installed air release can change
 # between builds and may require a newer Go toolchain than this image's 1.21 —
 # confirm, and consider pinning a version.
 RUN go install github.com/air-verse/air@latest
 # Copy go.mod first and fetch modules; "|| true" means a failed download does
 # not stop the build at this step.
 COPY go.mod ./
 RUN go mod download || true
 # Copy the rest of the build context into /app.
 COPY . .
 # Default command: run with example config
 CMD ["go", "run", "./cmd/logcorrelator", "-config", "config.example.conf"]
--- a/Dockerfile.package
+++ b/Dockerfile.package
@ -0,0 +1,125 @@
 # syntax=docker/dockerfile:1
 # =============================================================================
 # logcorrelator - Dockerfile de packaging unifié (DEB + RPM avec fpm)
 # =============================================================================
 # =============================================================================
 # Stage 1: Builder - compiles the Go binary
 # =============================================================================
 FROM golang:1.21 AS builder
 WORKDIR /build
 # Install dependencies
 RUN apt-get update && apt-get install -y --no-install-recommends \
    git \
    && rm -rf /var/lib/apt/lists/*
 # Copy go mod files
 COPY go.mod go.sum ./
 RUN go mod download
 # Copy source code
 COPY . .
 # Build binary for Linux (linux/amd64, cgo disabled, -w -s linker flags).
 # The result is written to /build/dist/logcorrelator.
 # NOTE(review): VERSION is declared here but not referenced by the build
 # command in this stage.
 ARG VERSION=1.0.0
 RUN mkdir -p dist && \
    CGO_ENABLED=0 GOOS=linux GOARCH=amd64 \
    go build -ldflags="-w -s" \
    -o dist/logcorrelator \
    ./cmd/logcorrelator
 # =============================================================================
 # Stage 2: Package builder - fpm for DEB and RPM
 # =============================================================================
 FROM ruby:3.2-bookworm AS package-builder
 WORKDIR /package
 # Install the rpm, dpkg-dev and fakeroot packages, then fpm itself
 # (pinned to version 1.16.0).
 RUN apt-get update && apt-get install -y --no-install-recommends \
    rpm \
    dpkg-dev \
    fakeroot \
    && rm -rf /var/lib/apt/lists/* \
    && gem install fpm -v 1.16.0
 # Copy binary from builder
 COPY --from=builder /build/dist/logcorrelator /tmp/pkgroot/usr/bin/logcorrelator
 COPY --from=builder /build/config.example.conf /tmp/pkgroot/etc/logcorrelator/logcorrelator.conf
 COPY --from=builder /build/config.example.conf /tmp/pkgroot/usr/share/logcorrelator/logcorrelator.conf.example
 # Create directories and set permissions
 RUN mkdir -p /tmp/pkgroot/var/log/logcorrelator && \
    mkdir -p /tmp/pkgroot/var/run/logcorrelator && \
    chmod 755 /tmp/pkgroot/usr/bin/logcorrelator && \
    chmod 640 /tmp/pkgroot/etc/logcorrelator/logcorrelator.conf && \
    chmod 640 /tmp/pkgroot/usr/share/logcorrelator/logcorrelator.conf.example && \
    chmod 755 /tmp/pkgroot/var/log/logcorrelator && \
    chmod 755 /tmp/pkgroot/var/run/logcorrelator
 # Copy maintainer scripts
 COPY packaging/deb/postinst /tmp/scripts/postinst
 COPY packaging/deb/prerm /tmp/scripts/prerm
 COPY packaging/deb/postrm /tmp/scripts/postrm
 RUN chmod 755 /tmp/scripts/*
 # Build DEB package
 ARG VERSION=1.0.0
 ARG ARCH=amd64
 RUN mkdir -p /packages/deb && \
    fpm -s dir -t deb \
    -n logcorrelator \
    -v "${VERSION}" \
    -C /tmp/pkgroot \
    --architecture "${ARCH}" \
    --description "Log correlation service for HTTP and network events" \
    --url "https://github.com/logcorrelator/logcorrelator" \
    --license "MIT" \
    --vendor "logcorrelator <dev@example.com>" \
    --maintainer "logcorrelator <dev@example.com>" \
    --depends "systemd" \
    --after-install /tmp/scripts/postinst \
    --before-remove /tmp/scripts/prerm \
    --after-remove /tmp/scripts/postrm \
    -p /packages/deb/logcorrelator_${VERSION}_${ARCH}.deb \
    usr/bin/logcorrelator \
    etc/logcorrelator/logcorrelator.conf \
    usr/share/logcorrelator/logcorrelator.conf.example \
    var/log/logcorrelator \
    var/run/logcorrelator
 # Build RPM package from the staged tree in /tmp/pkgroot; the result is written
 # to /packages/rpm/logcorrelator-${VERSION}-1.x86_64.rpm.
 # NOTE(review): DIST is declared but not referenced by the fpm command below —
 # confirm whether it was meant to be passed to fpm.
 ARG DIST=el8
 # The architecture is hard-coded to x86_64 here (the DEB build uses ${ARCH}),
 # and the install/remove hooks are the scripts copied from packaging/deb.
 RUN mkdir -p /packages/rpm && \
    fpm -s dir -t rpm \
    -n logcorrelator \
    -v "${VERSION}" \
    -C /tmp/pkgroot \
    --architecture "x86_64" \
    --description "Log correlation service for HTTP and network events" \
    --url "https://github.com/logcorrelator/logcorrelator" \
    --license "MIT" \
    --vendor "logcorrelator <dev@example.com>" \
    --depends "systemd" \
    --after-install /tmp/scripts/postinst \
    --before-remove /tmp/scripts/prerm \
    --after-remove /tmp/scripts/postrm \
    -p /packages/rpm/logcorrelator-${VERSION}-1.x86_64.rpm \
    usr/bin/logcorrelator \
    etc/logcorrelator/logcorrelator.conf \
    usr/share/logcorrelator/logcorrelator.conf.example \
    var/log/logcorrelator \
    var/run/logcorrelator
 # =============================================================================
 # Stage 3: Output - final image holding the built packages
 # =============================================================================
 FROM alpine:latest AS output
 WORKDIR /packages
 # Collect the DEB and RPM files produced by the package-builder stage.
 COPY --from=package-builder /packages/deb/*.deb /packages/deb/
 COPY --from=package-builder /packages/rpm/*.rpm /packages/rpm/
 # Default command: list the packages contained in the image.
 CMD ["sh", "-c", "echo '=== DEB Packages ===' && ls -la /packages/deb/ && echo '' && echo '=== RPM Packages ===' && ls -la /packages/rpm/"]
--- a/README.md
+++ b/README.md
@ -0,0 +1,278 @@
 # logcorrelator
 Service de corrélation de logs HTTP et réseau écrit en Go.
 ## Description
 **logcorrelator** reçoit deux flux de logs JSON via des sockets Unix :
 - **Source A** : logs HTTP applicatifs (Apache, reverse proxy)
 - **Source B** : logs réseau (métadonnées IP/TCP, JA3/JA4, etc.)
 Il corrèle les événements sur la base de `src_ip + src_port` avec une fenêtre temporelle configurable, et produit des logs corrélés vers :
 - Un fichier local (JSON lines)
 - ClickHouse (pour analyse et archivage)
 ## Architecture
 ```
 ┌─────────────────┐     ┌──────────────────┐     ┌─────────────────┐
 │  Apache Source  │────▶│                  │────▶│   File Sink     │
 │  (Unix Socket)  │     │  Correlation     │     │   (JSON lines)  │
 └─────────────────┘     │  Service         │     └─────────────────┘
                        │                  │
 ┌─────────────────┐     │  - Buffers       │     ┌─────────────────┐
 │  Network Source │────▶│  - Time Window   │────▶│  ClickHouse     │
 │  (Unix Socket)  │     │  - Orphan Policy │     │  Sink           │
 └─────────────────┘     └──────────────────┘     └─────────────────┘
 ```
 ## Build (100% Docker)
 Tout le build et les tests s'exécutent dans des containers Docker :
 ```bash
 # Build complet (binaire + tests + RPM)
 ./build.sh
 # Uniquement les tests
 ./test.sh
 # Build manuel avec Docker
 docker build --target builder -t logcorrelator-builder .
 docker build --target runtime -t logcorrelator:latest .
 ```
 ### Prérequis
 - Docker 20.10+
 - Bash
 ## Installation
 ### Depuis Docker
 ```bash
 # Build de l'image
 ./build.sh
 # Exécuter
 docker run -d \
    --name logcorrelator \
    -v /var/run/logcorrelator:/var/run/logcorrelator \
    -v /var/log/logcorrelator:/var/log/logcorrelator \
    -v ./config.conf:/etc/logcorrelator/logcorrelator.conf \
    logcorrelator:latest
 ```
 ### Depuis le package RPM (Rocky Linux 8+)
 ```bash
 # Générer le RPM
 ./build.sh
 # Installer le package
 sudo rpm -ivh dist/logcorrelator-1.0.0.rpm
 # Activer et démarrer le service
 sudo systemctl enable logcorrelator
 sudo systemctl start logcorrelator
 # Vérifier le statut
 sudo systemctl status logcorrelator
 ```
 ### Build manuel (sans Docker)
 ```bash
 # Prérequis: Go 1.21+
 go build -o logcorrelator ./cmd/logcorrelator
 # Exécuter
 ./logcorrelator -config config.example.conf
 ```
 ## Configuration
 La configuration utilise un fichier texte simple avec des directives :
 ```bash
 # Format: directive value [value...]
 # Les lignes commençant par # sont des commentaires
 service.name logcorrelator
 service.language go
 # Inputs (au moins 2 requis)
 input.unix_socket apache_source /var/run/logcorrelator/apache.sock json
 input.unix_socket network_source /var/run/logcorrelator/network.sock json
 # Outputs
 output.file.enabled true
 output.file.path /var/log/logcorrelator/correlated.log
 output.clickhouse.enabled false
 output.clickhouse.dsn clickhouse://user:pass@localhost:9000/db
 output.clickhouse.table correlated_logs_http_network
 output.clickhouse.batch_size 500
 output.clickhouse.flush_interval_ms 200
 # Corrélation
 correlation.key src_ip,src_port
 correlation.time_window.value 1
 correlation.time_window.unit s
 # Politique des orphelins
 correlation.orphan_policy.apache_always_emit true
 correlation.orphan_policy.network_emit false
 ```
 ### Directives disponibles
 | Directive | Description | Défaut |
 |-----------|-------------|--------|
 | `service.name` | Nom du service | `logcorrelator` |
 | `service.language` | Langage | `go` |
 | `input.unix_socket` | Socket Unix (name path [format]) | Requis |
 | `output.file.enabled` | Activer sortie fichier | `true` |
 | `output.file.path` | Chemin fichier | `/var/log/logcorrelator/correlated.log` |
 | `output.clickhouse.enabled` | Activer ClickHouse | `false` |
 | `output.clickhouse.dsn` | DSN ClickHouse | - |
 | `output.clickhouse.table` | Table ClickHouse | - |
 | `output.clickhouse.batch_size` | Taille batch | `500` |
 | `output.clickhouse.flush_interval_ms` | Intervalle flush | `200` |
 | `output.clickhouse.max_buffer_size` | Buffer max | `5000` |
 | `output.clickhouse.drop_on_overflow` | Drop si overflow | `true` |
 | `output.stdout.enabled` | Sortie stdout (debug) | `false` |
 | `correlation.key` | Clés de corrélation | `src_ip,src_port` |
 | `correlation.time_window.value` | Valeur fenêtre | `1` |
 | `correlation.time_window.unit` | Unité (ms/s/m) | `s` |
 | `correlation.orphan_policy.apache_always_emit` | Émettre A seul | `true` |
 | `correlation.orphan_policy.network_emit` | Émettre B seul | `false` |
 ## Format des logs
 ### Source A (HTTP)
 ```json
 {
  "src_ip": "192.168.1.1",
  "src_port": 8080,
  "dst_ip": "10.0.0.1",
  "dst_port": 80,
  "timestamp": 1704110400000000000,
  "method": "GET",
  "path": "/api/test",
  "header_host": "example.com"
 }
 ```
 ### Source B (Réseau)
 ```json
 {
  "src_ip": "192.168.1.1",
  "src_port": 8080,
  "dst_ip": "10.0.0.1",
  "dst_port": 443,
  "ja3": "abc123def456",
  "ja4": "xyz789"
 }
 ```
 ### Log corrélé (sortie)
 ```json
 {
  "timestamp": "2024-01-01T12:00:00Z",
  "src_ip": "192.168.1.1",
  "src_port": 8080,
  "dst_ip": "10.0.0.1",
  "dst_port": 80,
  "correlated": true,
  "apache": {"method": "GET", "path": "/api/test"},
  "network": {"ja3": "abc123def456"}
 }
 ```
 ## Schema ClickHouse
 ```sql
 CREATE TABLE correlated_logs_http_network (
    timestamp DateTime64(9),
    src_ip String,
    src_port UInt32,
    dst_ip String,
    dst_port UInt32,
    correlated UInt8,
    orphan_side String,
    apache JSON,
    network JSON
 ) ENGINE = MergeTree()
 ORDER BY (timestamp, src_ip, src_port);
 ```
 ## Tests
 ```bash
 # Via Docker
 ./test.sh
 # Local
 go test ./...
 go test -cover ./...
 go test -coverprofile=coverage.out ./...
 go tool cover -html=coverage.out
 ```
 ## Signaux
 | Signal | Comportement |
 |--------|--------------|
 | `SIGINT` | Arrêt gracieux |
 | `SIGTERM` | Arrêt gracieux |
 Lors de l'arrêt gracieux :
 1. Fermeture des sockets Unix
 2. Flush des buffers
 3. Émission des événements en attente
 4. Fermeture des connexions ClickHouse
 ## Logs internes
 Les logs internes sont envoyés vers stderr :
 ```bash
 # Docker
 docker logs -f logcorrelator
 # Systemd
 journalctl -u logcorrelator -f
 ```
 ## Structure du projet
 ```
 .
 ├── cmd/logcorrelator/       # Point d'entrée
 ├── internal/
 │   ├── adapters/
 │   │   ├── inbound/unixsocket/
 │   │   └── outbound/
 │   │       ├── clickhouse/
 │   │       ├── file/
 │   │       └── multi/
 │   ├── app/                 # Orchestration
 │   ├── config/              # Configuration
 │   ├── domain/              # Domaine (corrélation)
 │   ├── observability/       # Logging
 │   └── ports/               # Interfaces
 ├── config.example.conf      # Exemple de config
 ├── Dockerfile               # Build multi-stage
 ├── build.sh                 # Script de build
 ├── test.sh                  # Script de tests
 └── logcorrelator.service    # Unité systemd
 ```
 ## License
 MIT
--- a/architecture.yml
+++ b/architecture.yml
@ -0,0 +1,521 @@
 service:
  name: logcorrelator
  context: http-network-correlation
  language: go
  pattern: hexagonal
  description: >
    logcorrelator est un service système (lancé par systemd) écrit en Go, chargé
    de recevoir deux flux de logs JSON via des sockets Unix, de corréler les
    événements HTTP applicatifs (source A, typiquement Apache ou reverse proxy)
    avec des événements réseau (source B, métadonnées IP/TCP, JA3/JA4, etc.)
    sur la base de la combinaison strictement définie src_ip + src_port, avec
    une fenêtre temporelle configurable. Le service produit un log corrélé
    unique pour chaque paire correspondante, émet toujours les événements A
    même lorsqu’aucun événement B corrélé n’est disponible, n’émet jamais de
    logs B seuls, et pousse les logs agrégés en temps quasi réel vers
    ClickHouse et/ou un fichier local, en minimisant la rétention en mémoire
    et sur disque.
 runtime:
  deployment:
    unit_type: systemd
    description: >
      logcorrelator est livré sous forme de binaire autonome, exécuté comme un
      service systemd. L’unité systemd assure le démarrage automatique au boot,
      le redémarrage en cas de crash, et une intégration standard dans l’écosystème
      Linux (notamment sur Rocky Linux 8+).
    binary_path: /usr/bin/logcorrelator
    config_path: /etc/logcorrelator/logcorrelator.toml
    user: logcorrelator
    group: logcorrelator
    restart: on-failure
    systemd_unit:
      path: /etc/systemd/system/logcorrelator.service
      content_example: |
        [Unit]
        Description=logcorrelator service
        After=network.target
        [Service]
        Type=simple
        User=logcorrelator
        Group=logcorrelator
        ExecStart=/usr/bin/logcorrelator -config /etc/logcorrelator/logcorrelator.toml
        Restart=on-failure
        RestartSec=5
        [Install]
        WantedBy=multi-user.target
  os:
    supported:
      - rocky-linux-8+
      - rocky-linux-9+
      - autres-linux-recentes
  logs:
    stdout_stderr: journald
    structured: true
    description: >
      Les logs internes du service (erreurs, messages d’information) sont envoyés
      vers stdout/stderr et collectés par journald. Ils sont structurés et ne
      contiennent pas de données personnelles.
  signals:
    graceful_shutdown:
      - SIGINT
      - SIGTERM
    description: >
      En réception de SIGINT ou SIGTERM, le service arrête proprement la lecture
      des sockets Unix, vide les buffers d’envoi (dans les limites de la politique
      de drop), ferme les connexions ClickHouse puis s’arrête.
 config:
  format: toml
  location: /etc/logcorrelator/logcorrelator.toml
  description: >
    Toute la configuration est centralisée dans un fichier TOML lisible, stocké
    dans /etc/logcorrelator. Ni YAML ni JSON ne sont utilisés pour la config.
  reload_strategy: restart_service
  example: |
    [service]
    name = "logcorrelator"
    language = "go"
    [[inputs.unix_sockets]]
    name = "apache_source"
    path = "/var/run/logcorrelator/apache.sock"
    format = "json"
    [[inputs.unix_sockets]]
    name = "network_source"
    path = "/var/run/logcorrelator/network.sock"
    format = "json"
    [outputs.file]
    enabled = true
    path = "/var/log/logcorrelator/correlated.log"
    [outputs.clickhouse]
    enabled = true
    dsn = "clickhouse://user:pass@host:9000/db"
    table = "correlated_logs_http_network"
    batch_size = 500
    flush_interval_ms = 200
    max_buffer_size = 5000
    drop_on_overflow = true
    async_insert = true
    [correlation]
    key = ["src_ip", "src_port"]
    [correlation.time_window]
    value = 1
    unit = "s"
    [correlation.orphan_policy]
    apache_always_emit = true
    network_emit = false
 inputs:
  description: >
    Le service consomme deux flux de logs JSON via des sockets Unix. Le schéma
    exact des logs pour chaque source est flexible et peut évoluer. Seuls
    quelques champs sont nécessaires pour la corrélation.
  unix_sockets:
    - name: apache_source
      id: A
      description: >
        Source A, destinée aux logs HTTP applicatifs (Apache, reverse proxy, etc.).
        Le schéma JSON est variable, avec un champ timestamp numérique obligatoire
        et des champs header_* dynamiques.
      path: /var/run/logcorrelator/apache.sock
      protocol: unix
      mode: stream
      format: json
      framing: line
      retry_on_error: true
    - name: network_source
      id: B
      description: >
        Source B, destinée aux logs réseau (métadonnées IP/TCP, JA3/JA4, etc.).
        Le schéma JSON est variable ; seuls src_ip et src_port sont requis.
      path: /var/run/logcorrelator/network.sock
      protocol: unix
      mode: stream
      format: json
      framing: line
      retry_on_error: true
 outputs:
  description: >
    Les logs corrélés sont envoyés vers un ou plusieurs sinks. MultiSink permet
    de diffuser chaque log corrélé vers plusieurs destinations (fichier,
    ClickHouse, stdout…).
  sinks:
    file:
      enabled: true
      description: >
        Sink vers fichier local, utile pour debug ou archivage local. Écrit un
        JSON par ligne dans le chemin configuré. Rotation gérée par logrotate
        ou équivalent.
      path: /var/log/logcorrelator/correlated.log
      format: json_lines
      rotate_managed_by: external
    clickhouse:
      enabled: true
      description: >
        Sink principal pour l’archivage et l’analyse en temps quasi réel. Les
        logs corrélés sont insérés en batch dans ClickHouse avec un small buffer
        et des inserts asynchrones. En cas de saturation ou d’indisponibilité
        ClickHouse, les logs sont drop pour éviter de saturer la machine locale.
      dsn: clickhouse://user:pass@host:9000/db
      table: correlated_logs_http_network
      batch_size: 500
      flush_interval_ms: 200
      max_buffer_size: 5000
      drop_on_overflow: true
      async_insert: true
      timeout_ms: 1000
    stdout:
      enabled: false
      description: >
        Sink optionnel vers stdout pour les tests et le développement.
 correlation:
  description: >
    Corrélation strictement basée sur src_ip + src_port et une fenêtre temporelle
    configurable. Aucun autre champ (dst_ip, dst_port, JA3/JA4, headers HTTP...)
    n’est utilisé pour la décision de corrélation.
  key:
    - src_ip
    - src_port
  time_window:
    value: 1
    unit: s
    description: >
      Fenêtre de temps symétrique appliquée aux timestamps de A et B. Deux
      événements sont corrélés si |tA - tB| <= time_window. La valeur et l’unité
      sont définies dans le TOML.
  timestamp_source:
    apache: field_timestamp
    network: reception_time
    description: >
      Pour A, utilisation du champ numérique "timestamp" (epoch ns). Pour B,
      utilisation du temps de réception local.
  orphan_policy:
    apache_always_emit: true
    network_emit: false
    description: >
      A est toujours émis (même sans B) avec correlated=false et orphan_side="A".
      B n’est jamais émis seul.
  matching:
    mode: one_to_one_first_match
    description: >
      Stratégie 1‑à‑1, premier match : lors de l’arrivée d’un événement, on
      cherche le premier événement compatible dans le buffer de l’autre source.
      Les autres restent en attente ou expirent.
 schema:
  description: >
    Les schémas des sources A et B sont variables. Le service impose seulement
    quelques champs obligatoires nécessaires à la corrélation et accepte des
    champs supplémentaires sans modification de code.
  source_A:
    description: >
      Logs HTTP applicatifs (Apache/reverse proxy) au format JSON. Schéma
      variable, avec champs obligatoires pour corrélation (src_ip, src_port,
      timestamp) et collecte des autres champs dans des maps.
    required_fields:
      - name: src_ip
        type: string
        description: Adresse IP source client.
      - name: src_port
        type: int
        description: Port source client.
      - name: timestamp
        type: int64
        unit: ns
        description: Timestamp de référence pour la corrélation.
    optional_fields:
      - name: time
        type: string
        format: rfc3339
      - name: dst_ip
        type: string
      - name: dst_port
        type: int
      - name: method
        type: string
      - name: path
        type: string
      - name: host
        type: string
      - name: http_version
        type: string
    dynamic_fields:
      - pattern: header_*
        target_map: headers
        description: >
          Tous les champs header_* sont collectés dans headers[clé] = valeur.
      - pattern: "*"
        target_map: extra
        description: >
          Tous les champs non reconnus explicitement vont dans extra.
  source_B:
    description: >
      Logs réseau JSON (IP/TCP, JA3/JA4...). Schéma variable. src_ip et src_port
      sont obligatoires pour la corrélation, le reste est libre.
    required_fields:
      - name: src_ip
        type: string
      - name: src_port
        type: int
    optional_fields:
      - name: dst_ip
        type: string
      - name: dst_port
        type: int
    dynamic_fields:
      - pattern: "*"
        target_map: extra
        description: >
          Tous les autres champs (ip_meta_*, tcp_meta_*, ja3, ja4, etc.) sont
          rangés dans extra.
  normalized_event:
    description: >
      Représentation interne unifiée des événements A/B sur laquelle opère la
      logique de corrélation.
    fields:
      - name: source
        type: enum("A","B")
      - name: timestamp
        type: time.Time
      - name: src_ip
        type: string
      - name: src_port
        type: int
      - name: dst_ip
        type: string
        optional: true
      - name: dst_port
        type: int
        optional: true
      - name: headers
        type: map[string]string
        optional: true
      - name: extra
        type: map[string]any
        description: Champs additionnels provenant de A ou B.
  correlated_log:
    description: >
      Structure du log corrélé émis vers les sinks (fichier, ClickHouse). Contient
      les informations de corrélation, les infos communes et les contenus de A/B.
    fields:
      - name: timestamp
        type: time.Time
      - name: src_ip
        type: string
      - name: src_port
        type: int
      - name: dst_ip
        type: string
        optional: true
      - name: dst_port
        type: int
        optional: true
      - name: correlated
        type: bool
      - name: orphan_side
        type: string
      - name: apache
        type: map[string]any
        optional: true
      - name: network
        type: map[string]any
        optional: true
      - name: extra
        type: map[string]any
        description: Champs dérivés éventuels.
 clickhouse_schema:
  strategy: external_ddls
  description: >
    logcorrelator ne gère pas les ALTER TABLE. La table ClickHouse doit être
    créée/modifiée en dehors du service. logcorrelator remplit les colonnes
    existantes qu’il connaît et met NULL si un champ manque.
  base_columns:
    - name: timestamp
      type: DateTime64(9)
    - name: src_ip
      type: String
    - name: src_port
      type: UInt32
    - name: dst_ip
      type: String
    - name: dst_port
      type: UInt32
    - name: correlated
      type: UInt8
    - name: orphan_side
      type: String
    - name: apache
      type: JSON
    - name: network
      type: JSON
  dynamic_fields:
    mode: map_or_additional_columns
    description: >
      Les champs dynamiques peuvent être exposés via colonnes dédiées créées par
      migration, ou via Map/JSON.
 architecture:
  description: >
    Architecture hexagonale : domaine de corrélation indépendant, ports
    abstraits pour les sources/sinks, adaptateurs pour sockets Unix, fichier et
    ClickHouse, couche application d’orchestration, et modules infra pour
    config/observabilité.
  modules:
    - name: cmd/logcorrelator
      type: entrypoint
      responsibilities:
        - Chargement configuration TOML.
        - Initialisation des adaptateurs d’entrée/sortie.
        - Création du CorrelationService.
        - Démarrage de l’orchestrateur.
        - Gestion du cycle de vie (signaux systemd).
    - name: internal/domain
      type: domain
      responsibilities:
        - Modèles NormalizedEvent et CorrelatedLog.
        - Implémentation de CorrelationService (buffers, fenêtre,
          orphelins).
    - name: internal/ports
      type: ports
      responsibilities:
        - EventSource, CorrelatedLogSink, TimeProvider.
    - name: internal/app
      type: application
      responsibilities:
        # Quoted on purpose: the text contains " : ", which would otherwise
        # make this list item parse as a mapping instead of a string.
        - "Orchestrator : relier EventSource → CorrelationService → MultiSink."
    - name: internal/adapters/inbound/unixsocket
      type: adapter_inbound
      responsibilities:
        - Lecture sockets Unix + parsing JSON → NormalizedEvent.
    - name: internal/adapters/outbound/file
      type: adapter_outbound
      responsibilities:
        - Écriture fichier JSON lines.
    - name: internal/adapters/outbound/clickhouse
      type: adapter_outbound
      responsibilities:
        - Bufferisation + inserts batch vers ClickHouse.
        - Application de drop_on_overflow.
    - name: internal/adapters/outbound/multi
      type: adapter_outbound
      responsibilities:
        - Fan-out vers plusieurs sinks.
    - name: internal/config
      type: infrastructure
      responsibilities:
        - Chargement/validation config TOML.
    - name: internal/observability
      type: infrastructure
      responsibilities:
        - Logging et métriques internes.
 testing:
  unit:
    description: >
      Tests unitaires table-driven avec couverture cible ≥ 80 %. Focalisés sur
      la logique de corrélation, parsing et sink ClickHouse.
    coverage_minimum: 0.8
    focus:
      - CorrelationService
      - Parsing A/B → NormalizedEvent
      - ClickHouseSink (batching, overflow)
      - MultiSink
  integration:
    description: >
      Tests d’intégration validant le flux complet A+B → corrélation → sinks,
      avec sockets simulés et ClickHouse mocké.
 docker:
  description: >
    Build et tests entièrement encapsulés dans Docker, avec multi‑stage build :
    un stage builder pour compiler et tester, un stage runtime minimal pour
    exécuter le service.
  images:
    builder:
      base: golang:latest
      purpose: build_and_test
    runtime:
      base: gcr.io/distroless/base-debian12
      purpose: run_binary_only
  build:
    multi_stage: true
    steps:
      - name: unit_tests
        description: >
          go test ./... avec génération de couverture. Le build échoue si la
          couverture est < 80 %.
      - name: compile_binary
        description: >
          Compilation CGO_ENABLED=0, GOOS=linux, GOARCH=amd64 pour un binaire
          statique /usr/bin/logcorrelator.
      - name: assemble_runtime_image
        description: >
          Copie du binaire dans l’image runtime et définition de l’ENTRYPOINT.
 packaging:
  description: >
    logcorrelator doit être distribué en package .rpm pour Rocky Linux (8+),
    construit intégralement dans Docker à partir du binaire compilé.
  formats:
    - rpm
  target_distros:
    - rocky-linux-8+
    - rocky-linux-9+
  tool: fpm
  build_pipeline:
    steps:
      - name: build_binary_in_docker
        description: >
          Utiliser l’image builder pour compiler logcorrelator et installer le
          binaire dans un répertoire de staging (par ex. /tmp/pkgroot/usr/bin/logcorrelator).
      - name: prepare_filesystem_layout
        description: >
          Créer la hiérarchie :
          - /usr/bin/logcorrelator
          - /etc/logcorrelator/logcorrelator.toml (exemple)
          - /etc/systemd/system/logcorrelator.service (unit)
          - /var/log/logcorrelator (répertoire de logs)
      - name: run_fpm_in_docker
        description: >
          Lancer un conteneur fpm (par ex. image ruby:fpm) avec montage de
          /tmp/pkgroot, et exécuter fpm -s dir -t rpm pour générer le .rpm
          compatible Rocky Linux.
      - name: verify_rpm_on_rocky
        description: >
          Tester l’installation et le démarrage du service dans un conteneur
          Rocky Linux 8/9 (docker run --rm -it rockylinux:8), en installant le
          .rpm, en activant le service systemd et en vérifiant qu’il démarre
          correctement.
 non_functional:
  performance:
    target_latency_ms: 1000
    description: >
      Latence visée < 1 s entre réception et insertion ClickHouse, avec
      batching léger.
  reliability:
    drop_on_clickhouse_failure: true
    description: >
      En cas de ClickHouse lent/HS, les logs sont drop au‑delà du buffer pour
      protéger la machine.
  security:
    user_separation: true
    privileges: least
    description: >
      Service sous utilisateur dédié, pas de secrets en clair dans les logs,
      principe de moindre privilège.
--- a/build.sh
+++ b/build.sh
@ -0,0 +1,75 @@
 #!/bin/bash
 # Build script - everything runs in Docker containers.
 #
 # Pipeline: (1) build + test in the "builder" stage, (2) build the runtime
 # image, (3) build the DEB/RPM packager image, (4) copy the packages out of
 # the packager image into ./dist.
 #
 # VERSION may be supplied through the environment; it defaults to 1.0.0.
 #
 # -e: abort on the first failing command; -u: treat unset variables as
 # errors; pipefail: a pipeline fails if any stage fails.
 set -euo pipefail
 SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 cd "$SCRIPT_DIR"
 VERSION="${VERSION:-1.0.0}"
 OUTPUT_DIR="${SCRIPT_DIR}/dist"
 echo "=============================================="
 echo "  logcorrelator - Docker Build Pipeline"
 echo "=============================================="
 echo ""
 # Create output directory
 mkdir -p "${OUTPUT_DIR}"
 # Step 1: Build and test
 echo "[1/4] Building and running tests in container..."
 docker build \
    --target builder \
    -t logcorrelator-builder:latest \
    -f Dockerfile .
 # Step 2: Build runtime image
 echo "[2/4] Building runtime image..."
 # The tag is quoted so a VERSION containing whitespace or glob characters
 # cannot be split into extra arguments.
 docker build \
    --target runtime \
    -t "logcorrelator:${VERSION}" \
    -t logcorrelator:latest \
    -f Dockerfile .
 # Step 3: Build packages (DEB + RPM)
 echo "[3/4] Building DEB and RPM packages in container..."
 docker build \
    --target output \
    --build-arg VERSION="${VERSION}" \
    -t logcorrelator-packager:latest \
    -f Dockerfile.package .
 # Extract packages from the packager image into the host output directory
 echo "[4/4] Extracting packages..."
 mkdir -p "${OUTPUT_DIR}/deb" "${OUTPUT_DIR}/rpm"
 docker run --rm -v "${OUTPUT_DIR}:/output" logcorrelator-packager:latest \
    sh -c 'cp -r /packages/deb /output/ && cp -r /packages/rpm /output/'
 echo ""
 echo "=============================================="
 echo "  Build Complete!"
 echo "=============================================="
 echo ""
 echo "Artifacts:"
 echo "  - Runtime image: logcorrelator:${VERSION}"
 echo "  - DEB package:   ${OUTPUT_DIR}/deb/logcorrelator_${VERSION}_amd64.deb"
 echo "  - RPM package:   ${OUTPUT_DIR}/rpm/logcorrelator-${VERSION}-1.x86_64.rpm"
 echo ""
 echo "Usage:"
 echo "  # Run with Docker:"
 echo "  docker run -d --name logcorrelator \\"
 echo "    -v /var/run/logcorrelator:/var/run/logcorrelator \\"
 echo "    -v /var/log/logcorrelator:/var/log/logcorrelator \\"
 echo "    -v ./config.conf:/etc/logcorrelator/logcorrelator.conf \\"
 echo "    logcorrelator:latest"
 echo ""
 echo "  # Install DEB on Debian/Ubuntu:"
 echo "  sudo dpkg -i ${OUTPUT_DIR}/deb/logcorrelator_${VERSION}_amd64.deb"
 echo "  sudo systemctl enable logcorrelator"
 echo "  sudo systemctl start logcorrelator"
 echo ""
 echo "  # Install RPM on Rocky Linux:"
 echo "  sudo rpm -ivh ${OUTPUT_DIR}/rpm/logcorrelator-${VERSION}-1.x86_64.rpm"
 echo "  sudo systemctl enable logcorrelator"
 echo "  sudo systemctl start logcorrelator"
 echo ""
--- a/config.example.conf
+++ b/config.example.conf
@ -0,0 +1,41 @@
 # logcorrelator configuration file
 # Format: directive value [value...]
 # Lines starting with # are comments
 # Service configuration
 service.name logcorrelator
 service.language go
 # Input sources (at least 2 required)
 # Format: input.unix_socket <name> <path> [format]
 input.unix_socket apache_source /var/run/logcorrelator/apache.sock json
 input.unix_socket network_source /var/run/logcorrelator/network.sock json
 # File output
 output.file.enabled true
 output.file.path /var/log/logcorrelator/correlated.log
 # ClickHouse output
 output.clickhouse.enabled false
 output.clickhouse.dsn clickhouse://user:pass@localhost:9000/db
 output.clickhouse.table correlated_logs_http_network
 output.clickhouse.batch_size 500
 output.clickhouse.flush_interval_ms 200
 output.clickhouse.max_buffer_size 5000
 output.clickhouse.drop_on_overflow true
 output.clickhouse.async_insert true
 output.clickhouse.timeout_ms 1000
 # Stdout output (for debugging)
 output.stdout.enabled false
 # Correlation configuration
 correlation.key src_ip,src_port
 correlation.time_window.value 1
 correlation.time_window.unit s
 # Orphan policy
 # apache_always_emit: always emit A events even without matching B
 # network_emit: emit B events alone (usually false)
 correlation.orphan_policy.apache_always_emit true
 correlation.orphan_policy.network_emit false
--- a/go.mod
+++ b/go.mod
@ -0,0 +1,3 @@
 module github.com/logcorrelator/logcorrelator
 go 1.21
--- a/go.sum
+++ b/go.sum
--- a/internal/adapters/inbound/unixsocket/source.go
+++ b/internal/adapters/inbound/unixsocket/source.go
@ -0,0 +1,334 @@
 package unixsocket
 import (
 	"bufio"
 	"context"
 	"encoding/json"
 	"fmt"
 	"net"
 	"os"
 	"strconv"
 	"strings"
 	"sync"
 	"time"
 	"github.com/logcorrelator/logcorrelator/internal/domain"
 )
 const (
 	// DefaultSocketPermissions is the mode applied to the socket file right
 	// after it is created: read/write for owner and group, nothing for others.
 	DefaultSocketPermissions os.FileMode = 0660
 	// MaxLineSize is the upper bound, in bytes, handed to the line scanner
 	// for a single JSON event (1 MiB).
 	MaxLineSize = 1024 * 1024
 	// MaxConcurrentConnections sizes the semaphore that caps simultaneous
 	// client connections per socket.
 	MaxConcurrentConnections = 100
 	// MaxEventsPerSecond is the intended rate limit in events per second.
 	// NOTE(review): nothing in the visible code references this constant —
 	// confirm whether rate limiting is enforced elsewhere.
 	MaxEventsPerSecond = 10000
 )
 // Config holds the Unix socket source configuration.
 type Config struct {
 	// Name is the identifier returned by UnixSocketSource.Name.
 	Name string
 	// Path is the filesystem path of the Unix socket to listen on.
 	Path string
 }
 // UnixSocketSource reads JSON events from a Unix socket.
 // One goroutine accepts connections; each accepted connection is read by its
 // own goroutine, with at most MaxConcurrentConnections active at a time.
 type UnixSocketSource struct {
 	// config carries the source name and the socket path.
 	config    Config
 	// mu is held by Stop for the whole shutdown sequence.
 	mu        sync.Mutex
 	// listener is created by Start and closed by Stop.
 	listener  net.Listener
 	// done is closed by Stop to tell the accept loop to exit.
 	done      chan struct{}
 	// wg tracks the accept loop and every per-connection reader.
 	wg        sync.WaitGroup
 	semaphore chan struct{} // Limit concurrent connections
 }
 // NewUnixSocketSource builds a source for the given configuration. Nothing is
 // opened here; the socket is only created once Start is called.
 func NewUnixSocketSource(config Config) *UnixSocketSource {
 	src := new(UnixSocketSource)
 	src.config = config
 	// Closed by Stop to signal shutdown.
 	src.done = make(chan struct{})
 	// One slot per connection that may be served concurrently.
 	src.semaphore = make(chan struct{}, MaxConcurrentConnections)
 	return src
 }
 // Name returns the source name taken from the configuration passed to
 // NewUnixSocketSource.
 func (s *UnixSocketSource) Name() string {
 	return s.config.Name
 }
 // Start begins listening on the Unix socket and launches the accept loop.
 //
 // A stale socket file at the configured path is removed first; any other kind
 // of file at that path is reported as an error. The socket is created and
 // restricted to DefaultSocketPermissions, and only then published on
 // s.listener (under s.mu, the lock Stop uses), so a failed Start never leaves
 // an already-closed listener behind. Parsed events are delivered on eventChan.
 //
 // Returns an error if the stale socket cannot be removed, the path is occupied
 // by a non-socket, the listener cannot be created, or permissions cannot be set.
 func (s *UnixSocketSource) Start(ctx context.Context, eventChan chan<- *domain.NormalizedEvent) error {
 	// Remove existing socket file if present
 	if info, err := os.Stat(s.config.Path); err == nil {
 		if info.Mode()&os.ModeSocket == 0 {
 			return fmt.Errorf("path exists but is not a socket: %s", s.config.Path)
 		}
 		if err := os.Remove(s.config.Path); err != nil {
 			return fmt.Errorf("failed to remove existing socket: %w", err)
 		}
 	}
 	// Create listener
 	listener, err := net.Listen("unix", s.config.Path)
 	if err != nil {
 		return fmt.Errorf("failed to create unix socket listener: %w", err)
 	}
 	// Set permissions - fail if we can't
 	if err := os.Chmod(s.config.Path, DefaultSocketPermissions); err != nil {
 		listener.Close()
 		os.Remove(s.config.Path)
 		return fmt.Errorf("failed to set socket permissions: %w", err)
 	}
 	// Publish the listener only once it is fully set up.
 	s.mu.Lock()
 	s.listener = listener
 	s.mu.Unlock()
 	s.wg.Add(1)
 	go func() {
 		defer s.wg.Done()
 		s.acceptConnections(ctx, eventChan)
 	}()
 	return nil
 }
 // acceptConnections runs the accept loop until Stop is called or ctx is
 // cancelled. Each accepted connection is served by its own goroutine running
 // readEvents; when all MaxConcurrentConnections slots are taken the new
 // connection is closed immediately.
 func (s *UnixSocketSource) acceptConnections(ctx context.Context, eventChan chan<- *domain.NormalizedEvent) {
 	// Pause between retries after a failed Accept so a persistent error
 	// (e.g. file-descriptor exhaustion) does not turn into a busy loop.
 	const acceptRetryDelay = 50 * time.Millisecond
 	listener := s.listener
 	// Accept does not observe ctx, so close the listener on cancellation to
 	// unblock it. Stop closes the listener itself, hence the s.done exit.
 	go func() {
 		select {
 		case <-ctx.Done():
 			listener.Close()
 		case <-s.done:
 		}
 	}()
 	for {
 		select {
 		case <-s.done:
 			return
 		case <-ctx.Done():
 			return
 		default:
 		}
 		conn, err := listener.Accept()
 		if err != nil {
 			select {
 			case <-s.done:
 				return
 			case <-ctx.Done():
 				return
 			case <-time.After(acceptRetryDelay):
 				continue
 			}
 		}
 		// Check semaphore for connection limiting
 		select {
 		case s.semaphore <- struct{}{}:
 			// Connection accepted
 		default:
 			// Too many connections, reject
 			conn.Close()
 			continue
 		}
 		s.wg.Add(1)
 		go func(c net.Conn) {
 			defer s.wg.Done()
 			defer func() { <-s.semaphore }() // release the connection slot
 			defer c.Close()
 			s.readEvents(ctx, c, eventChan)
 		}(conn)
 	}
 }
 // readEvents reads newline-delimited JSON events from conn and forwards each
 // successfully parsed event on eventChan. Empty lines and lines that fail to
 // parse are skipped. It returns when the peer closes the connection, a line
 // exceeds MaxLineSize, the connection stays idle for idleTimeout, ctx is
 // cancelled, or Stop is called.
 func (s *UnixSocketSource) readEvents(ctx context.Context, conn net.Conn, eventChan chan<- *domain.NormalizedEvent) {
 	// The deadline is renewed before every read, so it bounds idle time
 	// rather than the total lifetime of a busy connection.
 	const idleTimeout = 5 * time.Minute
 	// Close the connection on shutdown so a reader blocked in Scan returns
 	// promptly instead of holding up Stop until the peer disconnects.
 	finished := make(chan struct{})
 	defer close(finished)
 	go func() {
 		select {
 		case <-s.done:
 		case <-ctx.Done():
 		case <-finished:
 			return
 		}
 		conn.Close()
 	}()
 	scanner := bufio.NewScanner(conn)
 	// Increase buffer size limit to 1MB
 	scanner.Buffer(make([]byte, 0, 4096), MaxLineSize)
 	for {
 		select {
 		case <-s.done:
 			return
 		case <-ctx.Done():
 			return
 		default:
 		}
 		conn.SetReadDeadline(time.Now().Add(idleTimeout))
 		if !scanner.Scan() {
 			// EOF, read error, oversized line, idle timeout or shutdown:
 			// in every case there is nothing further to read.
 			return
 		}
 		line := scanner.Bytes()
 		if len(line) == 0 {
 			continue
 		}
 		event, err := parseJSONEvent(line)
 		if err != nil {
 			// Malformed events are skipped; keep processing the stream.
 			continue
 		}
 		select {
 		case eventChan <- event:
 		case <-s.done:
 			return
 		case <-ctx.Done():
 			return
 		}
 	}
 }
 // parseJSONEvent decodes one JSON object into a NormalizedEvent.
 //
 // Required fields: src_ip (string) and src_port (1-65535). Optional fields:
 // dst_ip and dst_port (0-65535). The timestamp is taken, in order, from a
 // numeric "timestamp" (interpreted as Unix nanoseconds), an RFC 3339 "time"
 // string, or an RFC 3339 "timestamp" string; each candidate is tried even if
 // an earlier one is present but unparsable, and the current time is used when
 // none yields a value. Keys of the form header_<name> with string values are
 // collected into Headers under <name>; every remaining key that is not one of
 // the fields above goes to Extra. An event with at least one header is tagged
 // SourceA, otherwise SourceB.
 //
 // Returns an error for invalid JSON, a missing required field, or a port
 // outside its allowed range.
 func parseJSONEvent(data []byte) (*domain.NormalizedEvent, error) {
 	const headerPrefix = "header_"
 	var raw map[string]any
 	if err := json.Unmarshal(data, &raw); err != nil {
 		return nil, fmt.Errorf("invalid JSON: %w", err)
 	}
 	event := &domain.NormalizedEvent{
 		Raw:     raw,
 		Extra:   make(map[string]any),
 		Headers: make(map[string]string),
 	}
 	// Extract and validate src_ip
 	srcIP, ok := getString(raw, "src_ip")
 	if !ok {
 		return nil, fmt.Errorf("missing required field: src_ip")
 	}
 	event.SrcIP = srcIP
 	// Extract and validate src_port
 	srcPort, ok := getInt(raw, "src_port")
 	if !ok {
 		return nil, fmt.Errorf("missing required field: src_port")
 	}
 	if srcPort < 1 || srcPort > 65535 {
 		return nil, fmt.Errorf("src_port must be between 1 and 65535, got %d", srcPort)
 	}
 	event.SrcPort = srcPort
 	// Extract dst_ip (optional)
 	if dstIP, ok := getString(raw, "dst_ip"); ok {
 		event.DstIP = dstIP
 	}
 	// Extract dst_port (optional)
 	if dstPort, ok := getInt(raw, "dst_port"); ok {
 		if dstPort < 0 || dstPort > 65535 {
 			return nil, fmt.Errorf("dst_port must be between 0 and 65535, got %d", dstPort)
 		}
 		event.DstPort = dstPort
 	}
 	// Extract timestamp - numeric nanoseconds first, then RFC 3339 strings.
 	if ns, ok := getInt64(raw, "timestamp"); ok {
 		event.Timestamp = time.Unix(0, ns)
 	} else {
 		for _, key := range [...]string{"time", "timestamp"} {
 			text, ok := getString(raw, key)
 			if !ok {
 				continue
 			}
 			if parsed, err := time.Parse(time.RFC3339, text); err == nil {
 				event.Timestamp = parsed
 				break
 			}
 		}
 	}
 	if event.Timestamp.IsZero() {
 		event.Timestamp = time.Now()
 	}
 	// Single pass over the payload: route each key to Headers or Extra.
 	for k, v := range raw {
 		if strings.HasPrefix(k, headerPrefix) {
 			// A bare "header_" key (empty name) and non-string header
 			// values are dropped.
 			if name := k[len(headerPrefix):]; name != "" {
 				if sv, ok := v.(string); ok {
 					event.Headers[name] = sv
 				}
 			}
 			continue
 		}
 		switch k {
 		case "src_ip", "src_port", "dst_ip", "dst_port", "timestamp", "time":
 			// Already promoted to dedicated fields.
 		default:
 			event.Extra[k] = v
 		}
 	}
 	// Determine source based on fields present
 	if len(event.Headers) > 0 {
 		event.Source = domain.SourceA
 	} else {
 		event.Source = domain.SourceB
 	}
 	return event, nil
 }
 // getString returns m[key] when it is present and holds a string. The second
 // result is false for a missing key or a value of any other type.
 func getString(m map[string]any, key string) (string, bool) {
 	// A missing key yields a nil interface, for which the assertion fails.
 	text, isString := m[key].(string)
 	return text, isString
 }
 // getInt returns m[key] as an int when the value is an integer: a float64
 // holding a whole number (the form encoding/json produces for JSON numbers),
 // an int, an int64, or a base-10 string. The second result is false for a
 // missing key, an unsupported type, an unparsable string, or a float that is
 // fractional, NaN, infinite or outside the integer range — such floats are
 // rejected rather than silently truncated.
 func getInt(m map[string]any, key string) (int, bool) {
 	switch val := m[key].(type) {
 	case float64:
 		// Converting an out-of-range float to an integer is
 		// implementation-defined, so bound it first. NaN fails the
 		// round-trip comparison below.
 		if val < -(1<<63) || val >= 1<<63 {
 			return 0, false
 		}
 		n := int(int64(val))
 		if float64(n) != val {
 			return 0, false
 		}
 		return n, true
 	case int:
 		return val, true
 	case int64:
 		return int(val), true
 	case string:
 		if n, err := strconv.Atoi(val); err == nil {
 			return n, true
 		}
 	}
 	return 0, false
 }
 // getInt64 returns m[key] as an int64 when the value is an integer: a float64
 // holding a whole number (the form encoding/json produces for JSON numbers),
 // an int, an int64, or a base-10 string. The second result is false for a
 // missing key, an unsupported type, an unparsable string, or a float that is
 // fractional, NaN, infinite or outside the int64 range — such floats are
 // rejected rather than silently truncated.
 func getInt64(m map[string]any, key string) (int64, bool) {
 	switch val := m[key].(type) {
 	case float64:
 		// Converting an out-of-range float to an integer is
 		// implementation-defined, so bound it first. NaN fails the
 		// round-trip comparison below.
 		if val < -(1<<63) || val >= 1<<63 {
 			return 0, false
 		}
 		n := int64(val)
 		if float64(n) != val {
 			return 0, false
 		}
 		return n, true
 	case int:
 		return int64(val), true
 	case int64:
 		return val, true
 	case string:
 		if n, err := strconv.ParseInt(val, 10, 64); err == nil {
 			return n, true
 		}
 	}
 	return 0, false
 }
 // Stop gracefully stops the source: it signals shutdown, closes the listener,
 // waits for the accept loop and all connection readers to finish, and removes
 // the socket file. Stop is idempotent; calls after the first return nil
 // without doing anything.
 //
 // Returns an error only if the socket file exists but cannot be removed.
 func (s *UnixSocketSource) Stop() error {
 	s.mu.Lock()
 	defer s.mu.Unlock()
 	// Closing an already-closed channel panics, so detect a repeated Stop.
 	select {
 	case <-s.done:
 		return nil
 	default:
 		close(s.done)
 	}
 	if s.listener != nil {
 		s.listener.Close()
 	}
 	s.wg.Wait()
 	// Clean up socket file
 	if err := os.Remove(s.config.Path); err != nil && !os.IsNotExist(err) {
 		return fmt.Errorf("failed to remove socket file: %w", err)
 	}
 	return nil
 }
--- a/internal/adapters/inbound/unixsocket/source_test.go
+++ b/internal/adapters/inbound/unixsocket/source_test.go
@ -0,0 +1,98 @@
 package unixsocket
 import (
 	"testing"
 	"time"
 )
 // TestParseJSONEvent_Apache parses an event carrying header_* fields and
 // checks the source address, source port and the extracted headers.
 func TestParseJSONEvent_Apache(t *testing.T) {
 	payload := []byte(`{
 		"src_ip": "192.168.1.1",
 		"src_port": 8080,
 		"dst_ip": "10.0.0.1",
 		"dst_port": 80,
 		"timestamp": 1704110400000000000,
 		"method": "GET",
 		"path": "/api/test",
 		"header_host": "example.com",
 		"header_user_agent": "Mozilla/5.0"
 	}`)
 	parsed, err := parseJSONEvent(payload)
 	if err != nil {
 		t.Fatalf("unexpected error: %v", err)
 	}
 	if ip := parsed.SrcIP; ip != "192.168.1.1" {
 		t.Errorf("expected src_ip 192.168.1.1, got %s", ip)
 	}
 	if port := parsed.SrcPort; port != 8080 {
 		t.Errorf("expected src_port 8080, got %d", port)
 	}
 	// Header keys are stored without their "header_" prefix.
 	if host := parsed.Headers["host"]; host != "example.com" {
 		t.Errorf("expected header host example.com, got %s", host)
 	}
 	if agent := parsed.Headers["user_agent"]; agent != "Mozilla/5.0" {
 		t.Errorf("expected header_user_agent Mozilla/5.0, got %s", agent)
 	}
 }
 // TestParseJSONEvent_Network parses an event without header_* fields and
 // checks that unrecognised keys such as ja3 land in Extra.
 func TestParseJSONEvent_Network(t *testing.T) {
 	payload := []byte(`{
 		"src_ip": "192.168.1.1",
 		"src_port": 8080,
 		"dst_ip": "10.0.0.1",
 		"dst_port": 443,
 		"ja3": "abc123def456",
 		"ja4": "xyz789",
 		"tcp_meta_flags": "SYN"
 	}`)
 	parsed, err := parseJSONEvent(payload)
 	if err != nil {
 		t.Fatalf("unexpected error: %v", err)
 	}
 	if ip := parsed.SrcIP; ip != "192.168.1.1" {
 		t.Errorf("expected src_ip 192.168.1.1, got %s", ip)
 	}
 	if ja3 := parsed.Extra["ja3"]; ja3 != "abc123def456" {
 		t.Errorf("expected ja3 abc123def456, got %v", ja3)
 	}
 }
 // TestParseJSONEvent_InvalidJSON checks that malformed JSON is rejected.
 func TestParseJSONEvent_InvalidJSON(t *testing.T) {
 	if _, err := parseJSONEvent([]byte(`{invalid json}`)); err == nil {
 		t.Error("expected error for invalid JSON")
 	}
 }
 // TestParseJSONEvent_MissingFields checks that an object lacking the required
 // src_ip/src_port fields is rejected.
 func TestParseJSONEvent_MissingFields(t *testing.T) {
 	if _, err := parseJSONEvent([]byte(`{"other_field": "value"}`)); err == nil {
 		t.Error("expected error for missing src_ip/src_port")
 	}
 }
 // TestParseJSONEvent_StringTimestamp checks that an RFC 3339 "time" string is
 // used as the event timestamp.
 func TestParseJSONEvent_StringTimestamp(t *testing.T) {
 	payload := []byte(`{
 		"src_ip": "192.168.1.1",
 		"src_port": 8080,
 		"time": "2024-01-01T12:00:00Z"
 	}`)
 	parsed, err := parseJSONEvent(payload)
 	if err != nil {
 		t.Fatalf("unexpected error: %v", err)
 	}
 	want := time.Date(2024, 1, 1, 12, 0, 0, 0, time.UTC)
 	if got := parsed.Timestamp; !got.Equal(want) {
 		t.Errorf("expected timestamp %v, got %v", want, got)
 	}
 }
--- a/internal/adapters/outbound/clickhouse/sink.go
+++ b/internal/adapters/outbound/clickhouse/sink.go
@ -0,0 +1,333 @@
 package clickhouse
 import (
 	"context"
 	"database/sql"
 	"encoding/json"
 	"fmt"
 	"sync"
 	"time"
 	"github.com/logcorrelator/logcorrelator/internal/domain"
 )
 const (
 	// DefaultBatchSize is the number of buffered records that triggers an
 	// immediate flush when Config.BatchSize is not set.
 	DefaultBatchSize = 500
 	// DefaultFlushIntervalMs is the period, in milliseconds, of the
 	// time-based flush when Config.FlushIntervalMs is not set.
 	DefaultFlushIntervalMs = 200
 	// DefaultMaxBufferSize is the buffer capacity, in records, beyond which
 	// Write applies the overflow policy when Config.MaxBufferSize is not set.
 	DefaultMaxBufferSize = 5000
 	// DefaultTimeoutMs bounds, in milliseconds, each background flush and the
 	// wait of a blocked Write when Config.TimeoutMs is not set.
 	DefaultTimeoutMs = 1000
 	// DefaultPingTimeoutMs is the timeout, in milliseconds, of the initial
 	// connection ping performed by NewClickHouseSink.
 	DefaultPingTimeoutMs = 5000
 	// MaxRetries is the total number of insert attempts made per flush.
 	MaxRetries = 3
 	// RetryBaseDelay is the wait before the second attempt; it doubles for
 	// each further attempt.
 	RetryBaseDelay = 100 * time.Millisecond
 )
 // Config holds the ClickHouse sink configuration.
 // Non-positive BatchSize, FlushIntervalMs, MaxBufferSize and TimeoutMs are
 // replaced by the package defaults in NewClickHouseSink.
 type Config struct {
 	// DSN is the connection string passed to sql.Open.
 	DSN             string
 	// Table is the target table name; it is interpolated verbatim into the
 	// INSERT statement, so it must come from trusted configuration.
 	Table           string
 	// BatchSize is the buffered record count that triggers a flush.
 	BatchSize       int
 	// FlushIntervalMs is the periodic flush interval in milliseconds.
 	FlushIntervalMs int
 	// MaxBufferSize is the buffer capacity at which Write applies the
 	// overflow policy.
 	MaxBufferSize   int
 	// DropOnOverflow makes Write discard logs silently when the buffer is
 	// full instead of waiting.
 	DropOnOverflow  bool
 	// AsyncInsert is not referenced in the visible code.
 	// NOTE(review): confirm where (or whether) it is applied.
 	AsyncInsert     bool
 	// TimeoutMs bounds flushes and blocked writes, in milliseconds.
 	TimeoutMs       int
 }
 // ClickHouseSink writes correlated logs to ClickHouse.
 // Logs are accumulated in an in-memory buffer and inserted in batches by a
 // background goroutine, either periodically or when a batch fills up.
 type ClickHouseSink struct {
 	// config is the effective configuration.
 	config    Config
 	// db is the database handle; nil when the sink was built without connecting.
 	db        *sql.DB
 	// mu guards buffer.
 	mu        sync.Mutex
 	// buffer holds logs awaiting insertion.
 	buffer    []domain.CorrelatedLog
 	// flushChan wakes the flush goroutine when a batch is full.
 	flushChan chan struct{}
 	// done is closed by Close to stop the flush goroutine.
 	done      chan struct{}
 	// wg tracks the flush goroutine.
 	wg        sync.WaitGroup
 }
 // NewClickHouseSink connects to ClickHouse and starts the background flush
 // goroutine. Non-positive tunables in config are replaced by the package
 // defaults. An error is returned when the connection cannot be opened or the
 // initial ping does not succeed within DefaultPingTimeoutMs.
 //
 // NOTE(review): sql.Open looks up a driver registered under the name
 // "clickhouse"; no driver import is visible in this file — confirm one is
 // registered elsewhere in the build.
 func NewClickHouseSink(config Config) (*ClickHouseSink, error) {
 	// Apply defaults
 	orDefault := func(field *int, fallback int) {
 		if *field <= 0 {
 			*field = fallback
 		}
 	}
 	orDefault(&config.BatchSize, DefaultBatchSize)
 	orDefault(&config.FlushIntervalMs, DefaultFlushIntervalMs)
 	orDefault(&config.MaxBufferSize, DefaultMaxBufferSize)
 	orDefault(&config.TimeoutMs, DefaultTimeoutMs)
 	// Connect to ClickHouse
 	conn, err := sql.Open("clickhouse", config.DSN)
 	if err != nil {
 		return nil, fmt.Errorf("failed to connect to ClickHouse: %w", err)
 	}
 	// Ping with timeout
 	pingTimeout := time.Duration(DefaultPingTimeoutMs) * time.Millisecond
 	pingCtx, cancelPing := context.WithTimeout(context.Background(), pingTimeout)
 	defer cancelPing()
 	if err := conn.PingContext(pingCtx); err != nil {
 		conn.Close()
 		return nil, fmt.Errorf("failed to ping ClickHouse: %w", err)
 	}
 	sink := &ClickHouseSink{
 		config:    config,
 		db:        conn,
 		buffer:    make([]domain.CorrelatedLog, 0, config.BatchSize),
 		flushChan: make(chan struct{}, 1),
 		done:      make(chan struct{}),
 	}
 	// Start flush goroutine
 	sink.wg.Add(1)
 	go sink.flushLoop()
 	return sink, nil
 }
 // Name returns the sink name, the constant "clickhouse".
 func (s *ClickHouseSink) Name() string {
 	return "clickhouse"
 }
 // Write adds a log to the buffer and wakes the flush goroutine once the
 // buffer holds at least BatchSize records.
 //
 // When the buffer already holds MaxBufferSize records the overflow policy
 // applies: with DropOnOverflow the log is discarded and nil is returned;
 // otherwise Write waits, without holding the buffer lock so that flushes can
 // actually free space, until room appears, ctx is done (ctx.Err() is
 // returned) or TimeoutMs elapses ("buffer full, timeout exceeded").
 func (s *ClickHouseSink) Write(ctx context.Context, log domain.CorrelatedLog) error {
 	// How often a blocked writer re-checks the buffer for free space.
 	const pollInterval = 5 * time.Millisecond
 	// Created lazily so the common non-blocking path allocates no timer.
 	var deadline <-chan time.Time
 	for {
 		s.mu.Lock()
 		if len(s.buffer) < s.config.MaxBufferSize {
 			s.buffer = append(s.buffer, log)
 			batchReady := len(s.buffer) >= s.config.BatchSize
 			s.mu.Unlock()
 			// Trigger flush if batch is full
 			if batchReady {
 				select {
 				case s.flushChan <- struct{}{}:
 				default:
 					// A flush request is already pending.
 				}
 			}
 			return nil
 		}
 		s.mu.Unlock()
 		if s.config.DropOnOverflow {
 			// Drop the log
 			return nil
 		}
 		if deadline == nil {
 			timer := time.NewTimer(time.Duration(s.config.TimeoutMs) * time.Millisecond)
 			defer timer.Stop()
 			deadline = timer.C
 		}
 		select {
 		case <-ctx.Done():
 			return ctx.Err()
 		case <-deadline:
 			return fmt.Errorf("buffer full, timeout exceeded")
 		case <-time.After(pollInterval):
 			// Re-check whether a flush has freed space.
 		}
 	}
 }
 // Flush flushes the buffer to ClickHouse by delegating to doFlush with the
 // caller's context, and returns doFlush's error unchanged.
 func (s *ClickHouseSink) Flush(ctx context.Context) error {
 	return s.doFlush(ctx)
 }
 // Close stops the background flush goroutine, makes one final attempt to
 // insert any buffered logs (bounded by TimeoutMs) and closes the database
 // handle. Close is idempotent: calls after the first return nil without doing
 // anything. When the sink has no database handle, only the goroutine is
 // stopped.
 //
 // Returns the final flush error if there is one, otherwise the error from
 // closing the database handle.
 func (s *ClickHouseSink) Close() error {
 	// Closing an already-closed channel panics, so detect a repeated Close.
 	s.mu.Lock()
 	select {
 	case <-s.done:
 		s.mu.Unlock()
 		return nil
 	default:
 		close(s.done)
 	}
 	s.mu.Unlock()
 	s.wg.Wait()
 	if s.db == nil {
 		return nil
 	}
 	// The flush goroutine exits without draining, so flush what is left.
 	ctx, cancel := context.WithTimeout(context.Background(), time.Duration(s.config.TimeoutMs)*time.Millisecond)
 	flushErr := s.doFlush(ctx)
 	cancel()
 	closeErr := s.db.Close()
 	if flushErr != nil {
 		return fmt.Errorf("final flush failed: %w", flushErr)
 	}
 	return closeErr
 }
 // flushLoop is the background goroutine started by NewClickHouseSink. It
 // flushes on every tick when the buffer is non-empty, and on a flushChan
 // signal when the buffer holds at least BatchSize records. Each flush runs
 // under a TimeoutMs deadline and its error is discarded. The loop ends when
 // done is closed.
 func (s *ClickHouseSink) flushLoop() {
 	defer s.wg.Done()
 	ticker := time.NewTicker(time.Duration(s.config.FlushIntervalMs) * time.Millisecond)
 	defer ticker.Stop()
 	// flushIfAtLeast flushes when the buffer holds at least threshold records.
 	flushIfAtLeast := func(threshold int) {
 		s.mu.Lock()
 		pending := len(s.buffer)
 		s.mu.Unlock()
 		if pending < threshold {
 			return
 		}
 		// Use timeout context for flush
 		ctx, cancel := context.WithTimeout(context.Background(), time.Duration(s.config.TimeoutMs)*time.Millisecond)
 		s.doFlush(ctx)
 		cancel()
 	}
 	for {
 		select {
 		case <-s.done:
 			return
 		case <-ticker.C:
 			flushIfAtLeast(1)
 		case <-s.flushChan:
 			flushIfAtLeast(s.config.BatchSize)
 		}
 	}
 }
 // doFlush takes everything currently buffered and inserts it as one batch.
 // The insert is attempted up to MaxRetries times with exponential backoff
 // starting at RetryBaseDelay; retrying stops early on a non-retryable error or
 // when ctx is done. An empty buffer is a no-op that returns nil.
 //
 // The batch is removed from the buffer before the insert is attempted, so
 // logs of a batch that ultimately fails are not re-queued.
 func (s *ClickHouseSink) doFlush(ctx context.Context) error {
 	s.mu.Lock()
 	batch := s.buffer
 	if len(batch) == 0 {
 		s.mu.Unlock()
 		return nil
 	}
 	// Hand the filled slice to this flush and give writers a fresh one; this
 	// avoids copying the whole batch while holding the lock.
 	s.buffer = make([]domain.CorrelatedLog, 0, s.config.BatchSize)
 	s.mu.Unlock()
 	// Prepare batch insert with retry
 	query := fmt.Sprintf(`
 		INSERT INTO %s (timestamp, src_ip, src_port, dst_ip, dst_port, correlated, orphan_side, apache, network)
 		VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?)
 	`, s.config.Table)
 	// Retry logic with exponential backoff
 	var lastErr error
 	for attempt := 0; attempt < MaxRetries; attempt++ {
 		if attempt > 0 {
 			// Exponential backoff: base, 2*base, 4*base, ...
 			delay := RetryBaseDelay * time.Duration(1<<uint(attempt-1))
 			select {
 			case <-time.After(delay):
 			case <-ctx.Done():
 				return ctx.Err()
 			}
 		}
 		lastErr = s.executeBatch(ctx, query, batch)
 		if lastErr == nil {
 			return nil // Success
 		}
 		// Check if error is retryable
 		if !isRetryableError(lastErr) {
 			return fmt.Errorf("non-retryable error: %w", lastErr)
 		}
 	}
 	return fmt.Errorf("failed after %d retries: %w", MaxRetries, lastErr)
 }
 // executeBatch inserts every log of buffer inside a single transaction using
 // one prepared statement. The Apache and Network fields are serialised to
 // JSON strings and Correlated is sent as 0 or 1. Any failure — including a
 // field that cannot be serialised — aborts the batch: the deferred Rollback
 // undoes the transaction and the wrapped error is returned.
 func (s *ClickHouseSink) executeBatch(ctx context.Context, query string, buffer []domain.CorrelatedLog) error {
 	tx, err := s.db.BeginTx(ctx, nil)
 	if err != nil {
 		return fmt.Errorf("failed to begin transaction: %w", err)
 	}
 	// Rollback after a successful Commit is a no-op.
 	defer tx.Rollback()
 	stmt, err := tx.PrepareContext(ctx, query)
 	if err != nil {
 		return fmt.Errorf("failed to prepare statement: %w", err)
 	}
 	defer stmt.Close()
 	for _, entry := range buffer {
 		apacheJSON, err := json.Marshal(entry.Apache)
 		if err != nil {
 			return fmt.Errorf("failed to marshal apache fields: %w", err)
 		}
 		networkJSON, err := json.Marshal(entry.Network)
 		if err != nil {
 			return fmt.Errorf("failed to marshal network fields: %w", err)
 		}
 		correlated := 0
 		if entry.Correlated {
 			correlated = 1
 		}
 		_, err = stmt.ExecContext(ctx,
 			entry.Timestamp,
 			entry.SrcIP,
 			entry.SrcPort,
 			entry.DstIP,
 			entry.DstPort,
 			correlated,
 			entry.OrphanSide,
 			string(apacheJSON),
 			string(networkJSON),
 		)
 		if err != nil {
 			return fmt.Errorf("failed to execute insert: %w", err)
 		}
 	}
 	if err := tx.Commit(); err != nil {
 		return fmt.Errorf("failed to commit transaction: %w", err)
 	}
 	return nil
 }
 // isRetryableError reports whether err looks like a transient network
 // failure, judged by a case-insensitive search of its message for a fixed set
 // of phrases. A nil error is not retryable.
 func isRetryableError(err error) bool {
 	if err == nil {
 		return false
 	}
 	message := err.Error()
 	// Phrases that mark an error as worth retrying.
 	transientMarkers := [...]string{
 		"connection refused",
 		"connection reset",
 		"timeout",
 		"temporary failure",
 		"network is unreachable",
 		"broken pipe",
 	}
 	for _, marker := range transientMarkers {
 		if containsIgnoreCase(message, marker) {
 			return true
 		}
 	}
 	return false
 }
 // containsIgnoreCase reports whether substr occurs in s, treating the ASCII
 // letters A-Z and a-z as equal. Bytes outside A-Z are compared as-is.
 func containsIgnoreCase(s, substr string) bool {
 	if len(substr) > len(s) {
 		return false
 	}
 	return containsLower(s, substr)
 }
 // containsLower lower-cases both arguments (ASCII only) and reports whether
 // the lowered substr occurs in the lowered s.
 func containsLower(s, substr string) bool {
 	haystack, needle := toLower(s), toLower(substr)
 	for start := 0; start+len(needle) <= len(haystack); start++ {
 		if haystack[start:start+len(needle)] == needle {
 			return true
 		}
 	}
 	return false
 }
 // toLower returns s with the ASCII letters A-Z replaced by a-z; every other
 // byte is copied unchanged.
 func toLower(s string) string {
 	lowered := make([]byte, len(s))
 	for i := 0; i < len(s); i++ {
 		b := s[i]
 		if 'A' <= b && b <= 'Z' {
 			b += 'a' - 'A'
 		}
 		lowered[i] = b
 	}
 	return string(lowered)
 }
--- a/internal/adapters/outbound/clickhouse/sink_test.go
+++ b/internal/adapters/outbound/clickhouse/sink_test.go
@ -0,0 +1,305 @@
 package clickhouse
 import (
 	"context"
 	"testing"
 	"time"
 	"github.com/logcorrelator/logcorrelator/internal/domain"
 )
 func TestClickHouseSink_Name(t *testing.T) {
 	sink := &ClickHouseSink{
 		config: Config{
 			DSN:   "clickhouse://test:test@localhost:9000/test",
 			Table: "test_table",
 		},
 	}
 	if sink.Name() != "clickhouse" {
 		t.Errorf("expected name 'clickhouse', got %s", sink.Name())
 	}
 }
 // TestClickHouseSink_ConfigDefaults applies the default-substitution rules to
 // a zero-valued Config and checks that each tunable ends up at its default.
 // NOTE(review): the defaulting logic is re-implemented inline rather than
 // exercised through NewClickHouseSink, so this cannot detect a regression in
 // the constructor itself.
 func TestClickHouseSink_ConfigDefaults(t *testing.T) {
 	// Test that defaults are applied correctly
 	config := Config{
 		DSN:   "clickhouse://test:test@localhost:9000/test",
 		Table: "test_table",
 		// Other fields are zero, should get defaults
 	}
 	// Verify defaults would be applied (we can't actually connect in tests)
 	if config.BatchSize <= 0 {
 		config.BatchSize = DefaultBatchSize
 	}
 	if config.FlushIntervalMs <= 0 {
 		config.FlushIntervalMs = DefaultFlushIntervalMs
 	}
 	if config.MaxBufferSize <= 0 {
 		config.MaxBufferSize = DefaultMaxBufferSize
 	}
 	if config.TimeoutMs <= 0 {
 		config.TimeoutMs = DefaultTimeoutMs
 	}
 	if config.BatchSize != DefaultBatchSize {
 		t.Errorf("expected BatchSize %d, got %d", DefaultBatchSize, config.BatchSize)
 	}
 	if config.FlushIntervalMs != DefaultFlushIntervalMs {
 		t.Errorf("expected FlushIntervalMs %d, got %d", DefaultFlushIntervalMs, config.FlushIntervalMs)
 	}
 	if config.MaxBufferSize != DefaultMaxBufferSize {
 		t.Errorf("expected MaxBufferSize %d, got %d", DefaultMaxBufferSize, config.MaxBufferSize)
 	}
 	if config.TimeoutMs != DefaultTimeoutMs {
 		t.Errorf("expected TimeoutMs %d, got %d", DefaultTimeoutMs, config.TimeoutMs)
 	}
 }
 // TestClickHouseSink_Write_BufferOverflow checks that a hand-written Config
 // has a BatchSize no larger than its MaxBufferSize.
 // NOTE(review): despite its name this never calls Write; it only inspects the
 // literal defined below.
 func TestClickHouseSink_Write_BufferOverflow(t *testing.T) {
 	// This test verifies the buffer overflow logic without actually connecting
 	config := Config{
 		DSN:             "clickhouse://test:test@localhost:9000/test",
 		Table:           "test_table",
 		BatchSize:       10,
 		MaxBufferSize:   10,
 		DropOnOverflow:  true,
 		TimeoutMs:       100,
 		FlushIntervalMs: 1000,
 	}
 	// We can't test actual writes without a ClickHouse instance,
 	// but we can verify the config is valid
 	if config.BatchSize > config.MaxBufferSize {
 		t.Error("BatchSize should not exceed MaxBufferSize")
 	}
 }
 // TestClickHouseSink_IsRetryableError is a table-driven check of which error
 // messages isRetryableError classifies as transient.
 func TestClickHouseSink_IsRetryableError(t *testing.T) {
 	type testCase struct {
 		name     string
 		err      error
 		expected bool
 	}
 	cases := []testCase{
 		{name: "nil error", err: nil, expected: false},
 		{name: "connection refused", err: &mockError{"connection refused"}, expected: true},
 		{name: "connection reset", err: &mockError{"connection reset by peer"}, expected: true},
 		{name: "timeout", err: &mockError{"timeout waiting for response"}, expected: true},
 		{name: "network unreachable", err: &mockError{"network is unreachable"}, expected: true},
 		{name: "broken pipe", err: &mockError{"broken pipe"}, expected: true},
 		{name: "syntax error", err: &mockError{"syntax error in SQL"}, expected: false},
 		{name: "table not found", err: &mockError{"table test not found"}, expected: false},
 	}
 	for _, tc := range cases {
 		t.Run(tc.name, func(t *testing.T) {
 			if got := isRetryableError(tc.err); got != tc.expected {
 				t.Errorf("expected %v, got %v", tc.expected, got)
 			}
 		})
 	}
 }
 func TestClickHouseSink_FlushEmpty(t *testing.T) {
 	// Test that flushing an empty buffer doesn't cause issues
 	// (We can't test actual ClickHouse operations without a real instance)
 	s := &ClickHouseSink{
 		config: Config{
 			DSN:   "clickhouse://test:test@localhost:9000/test",
 			Table: "test_table",
 		},
 		buffer: make([]domain.CorrelatedLog, 0),
 	}
 	// Should not panic or error on empty flush
 	ctx := context.Background()
 	err := s.Flush(ctx)
 	if err != nil {
 		t.Errorf("expected no error on empty flush, got %v", err)
 	}
 }
 func TestClickHouseSink_CloseWithoutConnect(t *testing.T) {
 	// Test that closing without connecting doesn't panic
 	s := &ClickHouseSink{
 		config: Config{
 			DSN:   "clickhouse://test:test@localhost:9000/test",
 			Table: "test_table",
 		},
 		buffer: make([]domain.CorrelatedLog, 0),
 		done:   make(chan struct{}),
 	}
 	err := s.Close()
 	if err != nil {
 		t.Errorf("expected no error on close without connect, got %v", err)
 	}
 }
 // TestClickHouseSink_Constants is a sanity check that every package-level
 // default and retry constant is strictly positive.
 func TestClickHouseSink_Constants(t *testing.T) {
 	// Verify constants have reasonable values
 	if DefaultBatchSize <= 0 {
 		t.Error("DefaultBatchSize should be positive")
 	}
 	if DefaultFlushIntervalMs <= 0 {
 		t.Error("DefaultFlushIntervalMs should be positive")
 	}
 	if DefaultMaxBufferSize <= 0 {
 		t.Error("DefaultMaxBufferSize should be positive")
 	}
 	if DefaultTimeoutMs <= 0 {
 		t.Error("DefaultTimeoutMs should be positive")
 	}
 	if DefaultPingTimeoutMs <= 0 {
 		t.Error("DefaultPingTimeoutMs should be positive")
 	}
 	if MaxRetries <= 0 {
 		t.Error("MaxRetries should be positive")
 	}
 	if RetryBaseDelay <= 0 {
 		t.Error("RetryBaseDelay should be positive")
 	}
 }
 // mockError implements error for testing; it carries a fixed message so
 // tests can feed arbitrary error text to isRetryableError.
 type mockError struct {
 	// msg is returned verbatim by Error.
 	msg string
 }
 // Error returns the stored message.
 func (e *mockError) Error() string {
 	return e.msg
 }
 // Test the doFlush function with empty buffer (no actual DB connection)
 func TestClickHouseSink_DoFlushEmpty(t *testing.T) {
 	s := &ClickHouseSink{
 		config: Config{
 			DSN:   "clickhouse://test:test@localhost:9000/test",
 			Table: "test_table",
 		},
 		buffer: make([]domain.CorrelatedLog, 0),
 	}
 	ctx := context.Background()
 	err := s.doFlush(ctx)
 	if err != nil {
 		t.Errorf("expected no error when flushing empty buffer, got %v", err)
 	}
 }
 // TestClickHouseSink_BufferManagement starts from a buffer holding one log
 // and checks that Write appends a second one (no database involved).
 func TestClickHouseSink_BufferManagement(t *testing.T) {
 	entry := domain.CorrelatedLog{
 		SrcIP:      "192.168.1.1",
 		SrcPort:    8080,
 		Correlated: true,
 	}
 	cfg := Config{
 		DSN:            "clickhouse://test:test@localhost:9000/test",
 		Table:          "test_table",
 		MaxBufferSize:  100, // Allow more than 1 element
 		DropOnOverflow: false,
 		TimeoutMs:      1000,
 	}
 	sink := &ClickHouseSink{config: cfg, buffer: []domain.CorrelatedLog{entry}}
 	// Verify buffer has data
 	if got := len(sink.buffer); got != 1 {
 		t.Fatalf("expected buffer length 1, got %d", got)
 	}
 	// Test that Write properly adds to buffer
 	if err := sink.Write(context.Background(), entry); err != nil {
 		t.Errorf("unexpected error on Write: %v", err)
 	}
 	if got := len(sink.buffer); got != 2 {
 		t.Errorf("expected buffer length 2 after Write, got %d", got)
 	}
 }
 // Test Write with context cancellation
 func TestClickHouseSink_Write_ContextCancel(t *testing.T) {
 	s := &ClickHouseSink{
 		config: Config{
 			DSN:             "clickhouse://test:test@localhost:9000/test",
 			Table:           "test_table",
 			MaxBufferSize:   1,
 			DropOnOverflow:  false,
 			TimeoutMs:       10,
 		},
 		buffer: make([]domain.CorrelatedLog, 0, 1),
 	}
 	// Fill the buffer
 	log := domain.CorrelatedLog{SrcIP: "192.168.1.1", SrcPort: 8080}
 	s.buffer = append(s.buffer, log)
 	// Try to write with cancelled context
 	ctx, cancel := context.WithCancel(context.Background())
 	cancel() // Cancel immediately
 	err := s.Write(ctx, log)
 	if err == nil {
 		t.Error("expected error when writing with cancelled context")
 	}
 }
 // TestClickHouseSink_Write_DropOnOverflow fills a one-slot buffer with
 // DropOnOverflow enabled and checks both halves of the contract: Write
 // reports no error, and the extra log is actually discarded rather than
 // appended.
 func TestClickHouseSink_Write_DropOnOverflow(t *testing.T) {
 	s := &ClickHouseSink{
 		config: Config{
 			DSN:             "clickhouse://test:test@localhost:9000/test",
 			Table:           "test_table",
 			MaxBufferSize:   1,
 			DropOnOverflow:  true,
 			TimeoutMs:       10,
 		},
 		buffer: make([]domain.CorrelatedLog, 0, 1),
 	}
 	// Fill the buffer
 	log := domain.CorrelatedLog{SrcIP: "192.168.1.1", SrcPort: 8080}
 	s.buffer = append(s.buffer, log)
 	// Try to write when buffer is full - should drop silently
 	ctx := context.Background()
 	err := s.Write(ctx, log)
 	if err != nil {
 		t.Errorf("expected no error when DropOnOverflow is true, got %v", err)
 	}
 	// The buffer must be unchanged: the overflowing log was dropped.
 	if len(s.buffer) != 1 {
 		t.Errorf("expected dropped log to leave buffer length 1, got %d", len(s.buffer))
 	}
 }
 // BenchmarkClickHouseSink_Write measures the buffering path of Write without
 // a database. The buffer is emptied whenever it fills up; otherwise every
 // iteration past the first MaxBufferSize would only exercise the
 // drop-on-overflow early return.
 func BenchmarkClickHouseSink_Write(b *testing.B) {
 	s := &ClickHouseSink{
 		config: Config{
 			DSN:             "clickhouse://test:test@localhost:9000/test",
 			Table:           "test_table",
 			MaxBufferSize:   10000,
 			DropOnOverflow:  true,
 		},
 		buffer: make([]domain.CorrelatedLog, 0, 10000),
 	}
 	log := domain.CorrelatedLog{
 		Timestamp:  time.Now(),
 		SrcIP:      "192.168.1.1",
 		SrcPort:    8080,
 		Correlated: true,
 	}
 	ctx := context.Background()
 	b.ResetTimer()
 	for i := 0; i < b.N; i++ {
 		// Reuse the backing array so the append path keeps being measured.
 		if len(s.buffer) >= s.config.MaxBufferSize {
 			s.buffer = s.buffer[:0]
 		}
 		s.Write(ctx, log)
 	}
 }
--- a/internal/adapters/outbound/file/sink.go
+++ b/internal/adapters/outbound/file/sink.go
@ -0,0 +1,168 @@
 package file
 import (
 	"bufio"
 	"context"
 	"encoding/json"
 	"fmt"
 	"os"
 	"path/filepath"
 	"strings"
 	"sync"
 	"github.com/logcorrelator/logcorrelator/internal/domain"
 )
 const (
 	// DefaultFilePermissions is the mode passed to os.OpenFile when the
 	// output file is created (rw-r--r--).
 	DefaultFilePermissions os.FileMode = 0644
 	// DefaultDirPermissions is the mode passed to os.MkdirAll when the
 	// output file's parent directory is created (rwxr-x---).
 	DefaultDirPermissions os.FileMode = 0750
 )
 // Config holds the file sink configuration.
 type Config struct {
 	// Path is the output file location. It is checked by validateFilePath
 	// both in NewFileSink and again right before the file is opened.
 	Path string
 }
 // FileSink writes correlated logs to a file as JSON lines.
 // The file is opened lazily by the first Write, not by NewFileSink.
 type FileSink struct {
 	// config carries the validated output path.
 	config Config
 	// mu is held by Write, Flush and Close while they touch file and writer.
 	mu     sync.Mutex
 	// file is nil until openFile has succeeded.
 	file   *os.File
 	// writer buffers output in front of file; data reaches the file on
 	// Flush or Close (or when the bufio buffer fills).
 	writer *bufio.Writer
 }
 // NewFileSink builds a FileSink for config after checking config.Path with
 // validateFilePath. No file is opened here; that happens on the first Write.
 // A rejected path is reported as an error wrapped with "invalid file path".
 func NewFileSink(config Config) (*FileSink, error) {
 	err := validateFilePath(config.Path)
 	if err != nil {
 		return nil, fmt.Errorf("invalid file path: %w", err)
 	}
 	sink := new(FileSink)
 	sink.config = config
 	return sink, nil
 }
 // Name reports the fixed identifier of this sink type.
 func (s *FileSink) Name() string {
 	const sinkName = "file"
 	return sinkName
 }
 // Write appends log to the output as one JSON document followed by a newline.
 // The file is opened on first use. Data goes into the buffered writer only;
 // call Flush or Close to push it to the file. ctx is not consulted.
 func (s *FileSink) Write(ctx context.Context, log domain.CorrelatedLog) error {
 	s.mu.Lock()
 	defer s.mu.Unlock()
 	// Lazily open the target the first time something is written.
 	if needsOpen := s.file == nil; needsOpen {
 		if openErr := s.openFile(); openErr != nil {
 			return openErr
 		}
 	}
 	encoded, marshalErr := json.Marshal(log)
 	if marshalErr != nil {
 		return fmt.Errorf("failed to marshal log: %w", marshalErr)
 	}
 	_, writeErr := s.writer.Write(encoded)
 	if writeErr != nil {
 		return fmt.Errorf("failed to write log: %w", writeErr)
 	}
 	_, writeErr = s.writer.WriteString("\n")
 	if writeErr != nil {
 		return fmt.Errorf("failed to write newline: %w", writeErr)
 	}
 	return nil
 }
 // Flush pushes buffered output to the underlying file. It is a no-op that
 // returns nil when nothing has been written yet. ctx is not consulted.
 func (s *FileSink) Flush(ctx context.Context) error {
 	s.mu.Lock()
 	defer s.mu.Unlock()
 	if s.writer == nil {
 		return nil
 	}
 	return s.writer.Flush()
 }
 // Close flushes buffered output and closes the underlying file.
 //
 // The file is closed even when the flush fails, so the descriptor is never
 // leaked; the first error encountered (flush before close) is returned.
 // Both fields are reset afterwards, which makes Close safe to call more than
 // once (later calls return nil) and lets a subsequent Write reopen the file
 // instead of writing to a closed handle.
 func (s *FileSink) Close() error {
 	s.mu.Lock()
 	defer s.mu.Unlock()
 	var firstErr error
 	if s.writer != nil {
 		if err := s.writer.Flush(); err != nil {
 			firstErr = err
 		}
 		s.writer = nil
 	}
 	if s.file != nil {
 		// Always release the descriptor, regardless of the flush outcome.
 		if err := s.file.Close(); err != nil && firstErr == nil {
 			firstErr = err
 		}
 		s.file = nil
 	}
 	return firstErr
 }
 // openFile re-validates the configured path, creates its parent directory if
 // needed, opens the file in append mode (creating it when absent) and installs
 // a buffered writer on top of it. The caller must hold s.mu.
 func (s *FileSink) openFile() error {
 	target := s.config.Path
 	// Re-check the path right before touching the filesystem.
 	if err := validateFilePath(target); err != nil {
 		return fmt.Errorf("invalid file path: %w", err)
 	}
 	if err := os.MkdirAll(filepath.Dir(target), DefaultDirPermissions); err != nil {
 		return fmt.Errorf("failed to create directory: %w", err)
 	}
 	const openFlags = os.O_APPEND | os.O_CREATE | os.O_WRONLY
 	handle, err := os.OpenFile(target, openFlags, DefaultFilePermissions)
 	if err != nil {
 		return fmt.Errorf("failed to open file: %w", err)
 	}
 	s.file, s.writer = handle, bufio.NewWriter(handle)
 	return nil
 }
 // validateFilePath reports whether path is an acceptable output location.
 //
 // Rules, applied to the filepath.Clean'ed path:
 //   - an empty path is rejected;
 //   - a relative path is accepted (kept for tests) unless it climbs out of
 //     the working directory through a leading ".." segment;
 //   - an absolute path must be one of the allowed directories or lie beneath
 //     one. The comparison is done on whole path segments, so "/tmpfoo/x" is
 //     NOT treated as being inside "/tmp".
 //
 // File names that merely contain two dots (e.g. "a..b.log") are fine: after
 // Clean an absolute path cannot contain a ".." segment any more.
 // NOTE(review): symbolic links are not resolved here.
 func validateFilePath(path string) error {
 	if path == "" {
 		return fmt.Errorf("path cannot be empty")
 	}
 	cleanPath := filepath.Clean(path)
 	sep := string(filepath.Separator)
 	if !filepath.IsAbs(cleanPath) {
 		// After Clean, ".." can only survive as leading segments.
 		if cleanPath == ".." || strings.HasPrefix(cleanPath, ".."+sep) {
 			return fmt.Errorf("path cannot contain '..'")
 		}
 		return nil
 	}
 	allowedPrefixes := []string{
 		"/var/log/logcorrelator",
 		"/var/log",
 		"/tmp",
 	}
 	for _, prefix := range allowedPrefixes {
 		// Match the directory itself or anything strictly below it.
 		if cleanPath == prefix || strings.HasPrefix(cleanPath, prefix+sep) {
 			return nil
 		}
 	}
 	return fmt.Errorf("path must be in allowed directories: %v", allowedPrefixes)
 }
--- a/internal/adapters/outbound/file/sink_test.go
+++ b/internal/adapters/outbound/file/sink_test.go
@ -0,0 +1,96 @@
 package file
 import (
 	"context"
 	"os"
 	"path/filepath"
 	"testing"
 	"github.com/logcorrelator/logcorrelator/internal/domain"
 )
 // TestFileSink_Write writes one entry, flushes, and checks that the output
 // file exists and is not empty.
 func TestFileSink_Write(t *testing.T) {
 	ctx := context.Background()
 	outPath := filepath.Join(t.TempDir(), "test.log")
 	sink, err := NewFileSink(Config{Path: outPath})
 	if err != nil {
 		t.Fatalf("failed to create sink: %v", err)
 	}
 	defer sink.Close()
 	entry := domain.CorrelatedLog{
 		SrcIP:      "192.168.1.1",
 		SrcPort:    8080,
 		Correlated: true,
 	}
 	if err := sink.Write(ctx, entry); err != nil {
 		t.Fatalf("failed to write: %v", err)
 	}
 	if err := sink.Flush(ctx); err != nil {
 		t.Fatalf("failed to flush: %v", err)
 	}
 	// The flushed data must now be readable from disk.
 	contents, err := os.ReadFile(outPath)
 	if err != nil {
 		t.Fatalf("failed to read file: %v", err)
 	}
 	if len(contents) == 0 {
 		t.Error("expected non-empty file")
 	}
 }
 // TestFileSink_MultipleWrites writes five entries, closes the sink and checks
 // that the output file contains exactly five newline-terminated lines.
 func TestFileSink_MultipleWrites(t *testing.T) {
 	tmpDir := t.TempDir()
 	testPath := filepath.Join(tmpDir, "test.log")
 	sink, err := NewFileSink(Config{Path: testPath})
 	if err != nil {
 		t.Fatalf("failed to create sink: %v", err)
 	}
 	// Safety net for the early t.Fatalf exits below.
 	defer sink.Close()
 	for i := 0; i < 5; i++ {
 		log := domain.CorrelatedLog{
 			SrcIP:   "192.168.1.1",
 			SrcPort: 8080 + i,
 		}
 		if err := sink.Write(context.Background(), log); err != nil {
 			t.Fatalf("failed to write: %v", err)
 		}
 	}
 	// Close performs the flush; a failure here would otherwise surface as a
 	// misleading line-count mismatch further down.
 	if err := sink.Close(); err != nil {
 		t.Fatalf("failed to close: %v", err)
 	}
 	// Verify file has 5 lines
 	data, err := os.ReadFile(testPath)
 	if err != nil {
 		t.Fatalf("failed to read file: %v", err)
 	}
 	lines := 0
 	for _, b := range data {
 		if b == '\n' {
 			lines++
 		}
 	}
 	if lines != 5 {
 		t.Errorf("expected 5 lines, got %d", lines)
 	}
 }
 // TestFileSink_Name checks the identifier reported by a file sink.
 func TestFileSink_Name(t *testing.T) {
 	sink, err := NewFileSink(Config{Path: "/tmp/test.log"})
 	if err != nil {
 		t.Fatalf("failed to create sink: %v", err)
 	}
 	if got := sink.Name(); got != "file" {
 		t.Errorf("expected name 'file', got %s", got)
 	}
 }
--- a/internal/adapters/outbound/multi/sink.go
+++ b/internal/adapters/outbound/multi/sink.go
@ -0,0 +1,123 @@
 package multi
 import (
 	"context"
 	"sync"
 	"github.com/logcorrelator/logcorrelator/internal/domain"
 	"github.com/logcorrelator/logcorrelator/internal/ports"
 )
 // MultiSink fans out correlated logs to multiple sinks.
 type MultiSink struct {
 	// mu guards sinks: AddSink takes the write lock, while Write, Flush and
 	// Close take the read lock.
 	mu    sync.RWMutex
 	// sinks is the current set of fan-out targets.
 	sinks []ports.CorrelatedLogSink
 }
 // NewMultiSink returns a MultiSink that fans out to the given sinks.
 // It may be called without arguments; sinks can be added later via AddSink.
 func NewMultiSink(sinks ...ports.CorrelatedLogSink) *MultiSink {
 	ms := new(MultiSink)
 	ms.sinks = sinks
 	return ms
 }
 // Name reports the fixed identifier of this sink type.
 func (s *MultiSink) Name() string {
 	const sinkName = "multi"
 	return sinkName
 }
 // AddSink registers one more fan-out target. It takes the write lock, so it
 // can be called while other goroutines use the MultiSink.
 func (s *MultiSink) AddSink(sink ports.CorrelatedLogSink) {
 	s.mu.Lock()
 	s.sinks = append(s.sinks, sink)
 	s.mu.Unlock()
 }
 // Write hands log to every registered sink, each in its own goroutine.
 //
 // It returns nil when there are no sinks. Otherwise it waits until either all
 // sink writes have finished or ctx is done. In the first case it returns one
 // of the errors the sinks reported (the first one queued), or nil. In the
 // second case it returns ctx.Err() immediately; writes that are still running
 // keep running in the background.
 func (s *MultiSink) Write(ctx context.Context, log domain.CorrelatedLog) error {
 	// Work on a snapshot so the lock is not held during the sink calls.
 	s.mu.RLock()
 	targets := make([]ports.CorrelatedLogSink, len(s.sinks))
 	copy(targets, s.sinks)
 	s.mu.RUnlock()
 	if len(targets) == 0 {
 		return nil
 	}
 	// One slot per sink: a failing writer can always queue its error
 	// without blocking, even if nobody is receiving any more.
 	failures := make(chan error, len(targets))
 	var pending sync.WaitGroup
 	pending.Add(len(targets))
 	for _, target := range targets {
 		go func(sk ports.CorrelatedLogSink) {
 			defer pending.Done()
 			if err := sk.Write(ctx, log); err != nil {
 				failures <- err
 			}
 		}(target)
 	}
 	// Turn WaitGroup completion into something selectable.
 	finished := make(chan struct{})
 	go func() {
 		pending.Wait()
 		close(finished)
 	}()
 	select {
 	case <-finished:
 	case <-ctx.Done():
 		return ctx.Err()
 	}
 	// Every writer is done, so whatever was reported is already queued.
 	select {
 	case err := <-failures:
 		return err
 	default:
 		return nil
 	}
 }
 // Flush flushes every registered sink, in registration order.
 //
 // All sinks are attempted even when one of them fails, so a single broken
 // sink cannot leave the others holding unflushed data. The first error
 // encountered is returned, mirroring the behaviour of Close.
 func (s *MultiSink) Flush(ctx context.Context) error {
 	s.mu.RLock()
 	defer s.mu.RUnlock()
 	var firstErr error
 	for _, sink := range s.sinks {
 		if err := sink.Flush(ctx); err != nil && firstErr == nil {
 			firstErr = err
 		}
 	}
 	return firstErr
 }
 // Close closes every registered sink, in registration order. All sinks are
 // attempted; the first error encountered is returned.
 func (s *MultiSink) Close() error {
 	s.mu.RLock()
 	defer s.mu.RUnlock()
 	var result error
 	for i := range s.sinks {
 		err := s.sinks[i].Close()
 		if err == nil || result != nil {
 			continue
 		}
 		result = err
 	}
 	return result
 }
--- a/internal/adapters/outbound/multi/sink_test.go
+++ b/internal/adapters/outbound/multi/sink_test.go
@ -0,0 +1,114 @@
 package multi
 import (
 	"context"
 	"sync"
 	"testing"
 	"github.com/logcorrelator/logcorrelator/internal/domain"
 )
 // mockSink is a test double whose behaviour is injected through function
 // fields. All three function fields must be set before the matching method is
 // called.
 type mockSink struct {
 	name      string
 	mu        sync.Mutex
 	writeFunc func(domain.CorrelatedLog) error
 	flushFunc func() error
 	closeFunc func() error
 }
 // Name returns the configured name.
 func (m *mockSink) Name() string {
 	return m.name
 }
 // Write forwards log to writeFunc while holding the mock's mutex; ctx is
 // ignored.
 func (m *mockSink) Write(ctx context.Context, log domain.CorrelatedLog) error {
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	result := m.writeFunc(log)
 	return result
 }
 // Flush forwards to flushFunc; ctx is ignored.
 func (m *mockSink) Flush(ctx context.Context) error {
 	return m.flushFunc()
 }
 // Close forwards to closeFunc.
 func (m *mockSink) Close() error {
 	return m.closeFunc()
 }
 // TestMultiSink_Write checks that a single Write reaches both registered
 // sinks.
 func TestMultiSink_Write(t *testing.T) {
 	var (
 		counterMu sync.Mutex
 		calls     int
 	)
 	noop := func() error { return nil }
 	// countingSink builds a mock that bumps the shared counter on each write.
 	countingSink := func(name string) *mockSink {
 		return &mockSink{
 			name: name,
 			writeFunc: func(domain.CorrelatedLog) error {
 				counterMu.Lock()
 				defer counterMu.Unlock()
 				calls++
 				return nil
 			},
 			flushFunc: noop,
 			closeFunc: noop,
 		}
 	}
 	ms := NewMultiSink(countingSink("sink1"), countingSink("sink2"))
 	entry := domain.CorrelatedLog{SrcIP: "192.168.1.1"}
 	if err := ms.Write(context.Background(), entry); err != nil {
 		t.Fatalf("unexpected error: %v", err)
 	}
 	if calls != 2 {
 		t.Errorf("expected 2 writes, got %d", calls)
 	}
 }
 // TestMultiSink_Write_OneFails checks that Write reports an error when one of
 // two sinks fails.
 func TestMultiSink_Write_OneFails(t *testing.T) {
 	noop := func() error { return nil }
 	healthy := &mockSink{
 		name:      "sink1",
 		writeFunc: func(domain.CorrelatedLog) error { return nil },
 		flushFunc: noop,
 		closeFunc: noop,
 	}
 	failing := &mockSink{
 		name:      "sink2",
 		writeFunc: func(domain.CorrelatedLog) error { return context.Canceled },
 		flushFunc: noop,
 		closeFunc: noop,
 	}
 	ms := NewMultiSink(healthy, failing)
 	entry := domain.CorrelatedLog{SrcIP: "192.168.1.1"}
 	if err := ms.Write(context.Background(), entry); err == nil {
 		t.Error("expected error when one sink fails")
 	}
 }
 // TestMultiSink_AddSink checks that a sink added after construction can be
 // written to without error.
 func TestMultiSink_AddSink(t *testing.T) {
 	noop := func() error { return nil }
 	ms := NewMultiSink()
 	ms.AddSink(&mockSink{
 		name:      "dynamic",
 		writeFunc: func(domain.CorrelatedLog) error { return nil },
 		flushFunc: noop,
 		closeFunc: noop,
 	})
 	entry := domain.CorrelatedLog{SrcIP: "192.168.1.1"}
 	if err := ms.Write(context.Background(), entry); err != nil {
 		t.Fatalf("unexpected error: %v", err)
 	}
 }
--- a/internal/app/orchestrator.go
+++ b/internal/app/orchestrator.go
@ -0,0 +1,158 @@
 package app
 import (
 	"context"
 	"sync"
 	"sync/atomic"
 	"time"
 	"github.com/logcorrelator/logcorrelator/internal/domain"
 	"github.com/logcorrelator/logcorrelator/internal/ports"
 )
 const (
 	// DefaultEventChannelBufferSize is the capacity of the buffered channel
 	// that Start creates for each configured source.
 	DefaultEventChannelBufferSize = 1000
 	// ShutdownTimeout is the maximum time Stop waits for the orchestrator's
 	// goroutines to finish; the same deadline is passed to the final sink
 	// writes and flush.
 	ShutdownTimeout = 30 * time.Second
 )
 // OrchestratorConfig holds the orchestrator configuration.
 type OrchestratorConfig struct {
 	// Sources are the event producers; Start launches each one with its own
 	// event channel.
 	Sources []ports.EventSource
 	// Sink receives every correlated log and is flushed and closed by Stop.
 	Sink    ports.CorrelatedLogSink
 }
 // Orchestrator connects sources to the correlation service and sinks.
 type Orchestrator struct {
 	// config holds the sources and the sink.
 	config           OrchestratorConfig
 	// correlationSvc turns incoming events into correlated logs.
 	correlationSvc   ports.CorrelationProcessor
 	// ctx is handed to sources and sink writes; cancel (called by Stop)
 	// ends it. Both are created once in NewOrchestrator.
 	ctx              context.Context
 	cancel           context.CancelFunc
 	// wg tracks the two goroutines started per source.
 	wg               sync.WaitGroup
 	// running makes Start and Stop no-ops when called in the wrong state.
 	running          atomic.Bool
 }
 // NewOrchestrator builds an orchestrator around config and correlationSvc and
 // prepares the cancellable context that Stop later cancels. Nothing is
 // started until Start is called.
 func NewOrchestrator(config OrchestratorConfig, correlationSvc ports.CorrelationProcessor) *Orchestrator {
 	orch := &Orchestrator{config: config, correlationSvc: correlationSvc}
 	orch.ctx, orch.cancel = context.WithCancel(context.Background())
 	return orch
 }
 // Start launches, for every configured source, one goroutine that runs the
 // source and one that consumes its events. Calling Start on an orchestrator
 // that is already running does nothing. The returned error is always nil;
 // errors returned by a source's Start are discarded so the other sources keep
 // running.
 func (o *Orchestrator) Start() error {
 	if alreadyRunning := !o.running.CompareAndSwap(false, true); alreadyRunning {
 		return nil
 	}
 	for _, source := range o.config.Sources {
 		// Each source gets a private buffered channel.
 		events := make(chan *domain.NormalizedEvent, DefaultEventChannelBufferSize)
 		o.wg.Add(2)
 		// Consumer side.
 		go func(in chan *domain.NormalizedEvent) {
 			defer o.wg.Done()
 			o.processEvents(in)
 		}(events)
 		// Producer side.
 		go func(src ports.EventSource, out chan *domain.NormalizedEvent) {
 			defer o.wg.Done()
 			// Source failed, but continue with others
 			_ = src.Start(o.ctx, out)
 		}(source, events)
 	}
 	return nil
 }
 // processEvents consumes eventChan until it is closed or the orchestrator
 // context is cancelled. On cancellation the events that are already buffered
 // are still processed before the function returns.
 func (o *Orchestrator) processEvents(eventChan <-chan *domain.NormalizedEvent) {
 	for {
 		select {
 		case <-o.ctx.Done():
 			o.drainEvents(eventChan)
 			return
 		case event, ok := <-eventChan:
 			if !ok {
 				return
 			}
 			o.writeCorrelated(o.ctx, event)
 		}
 	}
 }
 // drainEvents processes whatever is currently buffered in eventChan without
 // blocking for new events. It writes with a fresh context bounded by
 // ShutdownTimeout: the orchestrator context is already cancelled at this
 // point, and sinks that honour cancellation would otherwise reject exactly
 // the events the drain is meant to save.
 func (o *Orchestrator) drainEvents(eventChan <-chan *domain.NormalizedEvent) {
 	drainCtx, cancel := context.WithTimeout(context.Background(), ShutdownTimeout)
 	defer cancel()
 	for {
 		select {
 		case event, ok := <-eventChan:
 			if !ok {
 				return
 			}
 			o.writeCorrelated(drainCtx, event)
 		default:
 			return
 		}
 	}
 }
 // writeCorrelated runs event through the correlation service and writes each
 // resulting log to the sink. Writes are best effort: a failing write must not
 // stop the processing of later logs or events.
 func (o *Orchestrator) writeCorrelated(ctx context.Context, event *domain.NormalizedEvent) {
 	for _, log := range o.correlationSvc.ProcessEvent(event) {
 		_ = o.config.Sink.Write(ctx, log)
 	}
 }
 // Stop gracefully stops the orchestrator.
 //
 // It cancels the orchestrator context, waits up to ShutdownTimeout for the
 // source and processing goroutines to finish, writes the logs still held by
 // the correlation service, then flushes and closes the sink. Every step is
 // attempted even if an earlier one failed. The first problem encountered
 // (wait timeout, write, flush or close error) is returned so the caller can
 // report an unclean shutdown. Calling Stop when not running returns nil.
 func (o *Orchestrator) Stop() error {
 	if !o.running.CompareAndSwap(true, false) {
 		return nil // Not running
 	}
 	// One deadline covers the whole shutdown sequence.
 	shutdownCtx, shutdownCancel := context.WithTimeout(context.Background(), ShutdownTimeout)
 	defer shutdownCancel()
 	var firstErr error
 	record := func(err error) {
 		if err != nil && firstErr == nil {
 			firstErr = err
 		}
 	}
 	// Cancel the main context so sources stop producing.
 	o.cancel()
 	// Wait in a helper goroutine so the wait itself can time out.
 	done := make(chan struct{})
 	go func() {
 		o.wg.Wait()
 		close(done)
 	}()
 	select {
 	case <-done:
 		// Goroutines stopped cleanly
 	case <-shutdownCtx.Done():
 		record(shutdownCtx.Err())
 	}
 	// Emit whatever the correlation service is still holding.
 	for _, log := range o.correlationSvc.Flush() {
 		record(o.config.Sink.Write(shutdownCtx, log))
 	}
 	record(o.config.Sink.Flush(shutdownCtx))
 	record(o.config.Sink.Close())
 	return firstErr
 }
--- a/internal/app/orchestrator_test.go
+++ b/internal/app/orchestrator_test.go
@ -0,0 +1,160 @@
 package app
 import (
 	"context"
 	"sync"
 	"testing"
 	"time"
 	"github.com/logcorrelator/logcorrelator/internal/domain"
 	"github.com/logcorrelator/logcorrelator/internal/ports"
 )
 // mockEventSource is a test double for an event source. Start records the
 // channel it was given and then blocks until its context is cancelled.
 type mockEventSource struct {
 	name      string
 	mu        sync.RWMutex
 	eventChan chan<- *domain.NormalizedEvent
 	started   bool
 	stopped   bool
 }
 // Name returns the configured name.
 func (m *mockEventSource) Name() string {
 	return m.name
 }
 // Start marks the source as started, remembers eventChan, waits for ctx to be
 // done, marks the source as stopped and returns nil.
 func (m *mockEventSource) Start(ctx context.Context, eventChan chan<- *domain.NormalizedEvent) error {
 	m.mu.Lock()
 	m.eventChan, m.started = eventChan, true
 	m.mu.Unlock()
 	<-ctx.Done()
 	m.mu.Lock()
 	m.stopped = true
 	m.mu.Unlock()
 	return nil
 }
 // Stop does nothing and returns nil.
 func (m *mockEventSource) Stop() error {
 	return nil
 }
 // getEventChan returns the channel recorded by Start, or nil before Start ran.
 func (m *mockEventSource) getEventChan() chan<- *domain.NormalizedEvent {
 	m.mu.RLock()
 	ch := m.eventChan
 	m.mu.RUnlock()
 	return ch
 }
 // isStarted reports whether Start has been entered.
 func (m *mockEventSource) isStarted() bool {
 	m.mu.RLock()
 	wasStarted := m.started
 	m.mu.RUnlock()
 	return wasStarted
 }
 // mockSink is a test double that records every log written to it.
 type mockSink struct {
 	mu      sync.Mutex
 	written []domain.CorrelatedLog
 }
 // Name returns the fixed name "mock".
 func (m *mockSink) Name() string {
 	return "mock"
 }
 // Write appends log to the recorded list and returns nil; ctx is ignored.
 func (m *mockSink) Write(ctx context.Context, log domain.CorrelatedLog) error {
 	m.mu.Lock()
 	m.written = append(m.written, log)
 	m.mu.Unlock()
 	return nil
 }
 // Flush does nothing and returns nil.
 func (m *mockSink) Flush(ctx context.Context) error {
 	return nil
 }
 // Close does nothing and returns nil.
 func (m *mockSink) Close() error {
 	return nil
 }
 // getWritten returns a copy of the recorded logs, so callers can inspect it
 // without holding the lock.
 func (m *mockSink) getWritten() []domain.CorrelatedLog {
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	snapshot := make([]domain.CorrelatedLog, 0, len(m.written))
 	snapshot = append(snapshot, m.written...)
 	return snapshot
 }
 // TestOrchestrator_StartStop starts an orchestrator with one mock source,
 // stops it shortly afterwards and checks that the source was started.
 func TestOrchestrator_StartStop(t *testing.T) {
 	src := &mockEventSource{name: "test"}
 	svc := domain.NewCorrelationService(domain.CorrelationConfig{
 		TimeWindow:       time.Second,
 		ApacheAlwaysEmit: true,
 		NetworkEmit:      false,
 	}, &domain.RealTimeProvider{})
 	orch := NewOrchestrator(OrchestratorConfig{
 		Sources: []ports.EventSource{src},
 		Sink:    &mockSink{},
 	}, svc)
 	if err := orch.Start(); err != nil {
 		t.Fatalf("failed to start: %v", err)
 	}
 	// Give the goroutines a moment to spin up.
 	time.Sleep(100 * time.Millisecond)
 	if err := orch.Stop(); err != nil {
 		t.Fatalf("failed to stop: %v", err)
 	}
 	if started := src.isStarted(); !started {
 		t.Error("expected source to be started")
 	}
 }
 // TestOrchestrator_ProcessEvent pushes one source-A event through a running
 // orchestrator and checks that at least one log reaches the sink by the time
 // Stop has returned.
 func TestOrchestrator_ProcessEvent(t *testing.T) {
 	src := &mockEventSource{name: "test"}
 	recorder := &mockSink{}
 	svc := domain.NewCorrelationService(domain.CorrelationConfig{
 		TimeWindow:       time.Second,
 		ApacheAlwaysEmit: true,
 		NetworkEmit:      false,
 	}, &domain.RealTimeProvider{})
 	orch := NewOrchestrator(OrchestratorConfig{
 		Sources: []ports.EventSource{src},
 		Sink:    recorder,
 	}, svc)
 	if err := orch.Start(); err != nil {
 		t.Fatalf("failed to start: %v", err)
 	}
 	// Poll (up to 50 times, 10ms apart) until the source has been handed
 	// its channel.
 	var input chan<- *domain.NormalizedEvent
 	for attempt := 0; attempt < 50; attempt++ {
 		if input = src.getEventChan(); input != nil {
 			break
 		}
 		time.Sleep(10 * time.Millisecond)
 	}
 	if input == nil {
 		t.Fatal("source did not start properly")
 	}
 	// Inject a single event as if the source had produced it.
 	input <- &domain.NormalizedEvent{
 		Source:    domain.SourceA,
 		Timestamp: time.Now(),
 		SrcIP:     "192.168.1.1",
 		SrcPort:   8080,
 		Raw:       map[string]any{"method": "GET"},
 	}
 	// Give it time to process
 	time.Sleep(100 * time.Millisecond)
 	if err := orch.Stop(); err != nil {
 		t.Fatalf("failed to stop: %v", err)
 	}
 	// Should have written at least one log (the orphan A)
 	if got := recorder.getWritten(); len(got) == 0 {
 		t.Error("expected at least one log to be written")
 	}
 }
--- a/internal/config/config.go
+++ b/internal/config/config.go
@ -0,0 +1,340 @@
 package config
 import (
 	"bufio"
 	"fmt"
 	"os"
 	"strconv"
 	"strings"
 	"time"
 )
 // Config holds the complete application configuration.
 // Load fills it with defaults and then applies the directives from the file.
 type Config struct {
 	// Service is set by the service.* directives.
 	Service     ServiceConfig
 	// Inputs is set by the input.* directives.
 	Inputs      InputsConfig
 	// Outputs is set by the output.* directives.
 	Outputs     OutputsConfig
 	// Correlation is set by the correlation.* directives.
 	Correlation CorrelationConfig
 }
 // ServiceConfig holds service-level configuration.
 type ServiceConfig struct {
 	// Name is set by service.name; Load defaults it to "logcorrelator".
 	Name     string
 	// Language is set by service.language; Load defaults it to "go".
 	Language string
 }
 // InputsConfig holds input sources configuration.
 type InputsConfig struct {
 	// UnixSockets gets one entry per input.unix_socket directive, in file
 	// order. Validate requires at least two entries.
 	UnixSockets []UnixSocketConfig
 }
 // UnixSocketConfig holds a Unix socket source configuration.
 // Directive syntax: input.unix_socket <name> <path> [format]
 type UnixSocketConfig struct {
 	// Name is the first argument of the directive.
 	Name   string
 	// Path is the second argument of the directive.
 	Path   string
 	// Format is the optional third argument; "json" when omitted.
 	Format string
 }
 // OutputsConfig holds output sinks configuration.
 // Validate requires at least one of the three outputs to be enabled.
 type OutputsConfig struct {
 	// File is set by the output.file.* directives.
 	File       FileOutputConfig
 	// ClickHouse is set by the output.clickhouse.* directives.
 	ClickHouse ClickHouseOutputConfig
 	// Stdout is set by the output.stdout.* directives.
 	Stdout     StdoutOutputConfig
 }
 // FileOutputConfig holds file sink configuration.
 type FileOutputConfig struct {
 	// Enabled is set by output.file.enabled; Load defaults it to true.
 	Enabled bool
 	// Path is set by output.file.path; Load defaults it to
 	// "/var/log/logcorrelator/correlated.log".
 	Path    string
 }
 // ClickHouseOutputConfig holds ClickHouse sink configuration.
 // Each field is set by the output.clickhouse.<snake_case_name> directive.
 type ClickHouseOutputConfig struct {
 	// Enabled defaults to false in Load.
 	Enabled         bool
 	// DSN has no default; Validate requires it when Enabled is true.
 	DSN             string
 	// Table has no default in Load.
 	Table           string
 	// BatchSize defaults to 500 in Load.
 	BatchSize       int
 	// FlushIntervalMs defaults to 200 in Load.
 	FlushIntervalMs int
 	// MaxBufferSize defaults to 5000 in Load.
 	MaxBufferSize   int
 	// DropOnOverflow defaults to true in Load.
 	DropOnOverflow  bool
 	// AsyncInsert defaults to true in Load.
 	AsyncInsert     bool
 	// TimeoutMs defaults to 1000 in Load.
 	TimeoutMs       int
 }
 // StdoutOutputConfig holds stdout sink configuration.
 type StdoutOutputConfig struct {
 	// Enabled is set by output.stdout.enabled; Load defaults it to false.
 	Enabled bool
 }
 // CorrelationConfig holds correlation configuration.
 type CorrelationConfig struct {
 	// Key is set by correlation.key as a comma-separated list; each item is
 	// trimmed. Load defaults it to {"src_ip", "src_port"}.
 	Key          []string
 	// TimeWindow is converted to a time.Duration by GetTimeWindow.
 	TimeWindow   TimeWindowConfig
 	// OrphanPolicy is set by the correlation.orphan_policy.* directives.
 	OrphanPolicy OrphanPolicyConfig
 }
 // TimeWindowConfig holds time window configuration.
 type TimeWindowConfig struct {
 	// Value is set by correlation.time_window.value; Load defaults it to 1.
 	// GetTimeWindow treats values <= 0 as 1.
 	Value int
 	// Unit is set by correlation.time_window.unit; Load defaults it to "s".
 	// GetTimeWindow recognises ms/millisecond(s), s/second(s) and
 	// m/minute(s); anything else is treated as seconds.
 	Unit  string
 }
 // OrphanPolicyConfig holds orphan event policy configuration.
 type OrphanPolicyConfig struct {
 	// ApacheAlwaysEmit is set by correlation.orphan_policy.apache_always_emit;
 	// Load defaults it to true.
 	ApacheAlwaysEmit bool
 	// NetworkEmit is set by correlation.orphan_policy.network_emit;
 	// Load defaults it to false.
 	NetworkEmit      bool
 }
 // Load reads the directive file at path and returns the resulting
 // configuration.
 //
 // It starts from built-in defaults, applies one directive per non-empty line
 // (lines starting with '#' are comments) and finally runs Validate. Errors
 // from a directive are prefixed with the 1-based line number.
 func Load(path string) (*Config, error) {
 	file, err := os.Open(path)
 	if err != nil {
 		return nil, fmt.Errorf("failed to open config file: %w", err)
 	}
 	defer file.Close()
 	// Built-in defaults; directives below override them.
 	cfg := new(Config)
 	cfg.Service = ServiceConfig{Name: "logcorrelator", Language: "go"}
 	cfg.Inputs.UnixSockets = make([]UnixSocketConfig, 0)
 	cfg.Outputs.File = FileOutputConfig{
 		Enabled: true,
 		Path:    "/var/log/logcorrelator/correlated.log",
 	}
 	cfg.Outputs.ClickHouse = ClickHouseOutputConfig{
 		Enabled:         false,
 		BatchSize:       500,
 		FlushIntervalMs: 200,
 		MaxBufferSize:   5000,
 		DropOnOverflow:  true,
 		AsyncInsert:     true,
 		TimeoutMs:       1000,
 	}
 	cfg.Outputs.Stdout = StdoutOutputConfig{Enabled: false}
 	cfg.Correlation = CorrelationConfig{
 		Key:          []string{"src_ip", "src_port"},
 		TimeWindow:   TimeWindowConfig{Value: 1, Unit: "s"},
 		OrphanPolicy: OrphanPolicyConfig{ApacheAlwaysEmit: true, NetworkEmit: false},
 	}
 	scanner := bufio.NewScanner(file)
 	for lineNum := 1; scanner.Scan(); lineNum++ {
 		line := strings.TrimSpace(scanner.Text())
 		// Blank lines and comments carry no directive.
 		isBlank, isComment := line == "", strings.HasPrefix(line, "#")
 		if isBlank || isComment {
 			continue
 		}
 		if err := parseDirective(cfg, line); err != nil {
 			return nil, fmt.Errorf("line %d: %w", lineNum, err)
 		}
 	}
 	if err := scanner.Err(); err != nil {
 		return nil, fmt.Errorf("failed to read config file: %w", err)
 	}
 	if err := cfg.Validate(); err != nil {
 		return nil, fmt.Errorf("invalid config: %w", err)
 	}
 	return cfg, nil
 }
 // parseDirective applies one "<directive> <value...>" line to cfg.
 //
 // The line is split on whitespace; the first field selects the setting and
 // the remaining fields, re-joined with single spaces, form the value.
 // It returns an error for a line with fewer than two fields, an unknown
 // directive, or a value that cannot be parsed as the expected bool/int.
 func parseDirective(cfg *Config, line string) error {
 	parts := strings.Fields(line)
 	if len(parts) < 2 {
 		return fmt.Errorf("invalid directive: %s", line)
 	}
 	directive, value := parts[0], strings.Join(parts[1:], " ")
 	// setBool and setInt parse value and store it in dst; on failure the
 	// error names the directive, producing exactly
 	// "invalid value for <directive>: <cause>".
 	setBool := func(dst *bool) error {
 		parsed, err := parseBool(value)
 		if err != nil {
 			return fmt.Errorf("invalid value for %s: %w", directive, err)
 		}
 		*dst = parsed
 		return nil
 	}
 	setInt := func(dst *int) error {
 		parsed, err := strconv.Atoi(value)
 		if err != nil {
 			return fmt.Errorf("invalid value for %s: %w", directive, err)
 		}
 		*dst = parsed
 		return nil
 	}
 	clickhouse := &cfg.Outputs.ClickHouse
 	orphans := &cfg.Correlation.OrphanPolicy
 	switch directive {
 	case "service.name":
 		cfg.Service.Name = value
 	case "service.language":
 		cfg.Service.Language = value
 	case "input.unix_socket":
 		// Format: input.unix_socket <name> <path> [format]
 		if len(parts) < 3 {
 			return fmt.Errorf("input.unix_socket requires name and path")
 		}
 		format := "json"
 		if len(parts) >= 4 {
 			format = parts[3]
 		}
 		cfg.Inputs.UnixSockets = append(cfg.Inputs.UnixSockets, UnixSocketConfig{
 			Name:   parts[1],
 			Path:   parts[2],
 			Format: format,
 		})
 	case "output.file.enabled":
 		return setBool(&cfg.Outputs.File.Enabled)
 	case "output.file.path":
 		cfg.Outputs.File.Path = value
 	case "output.clickhouse.enabled":
 		return setBool(&clickhouse.Enabled)
 	case "output.clickhouse.dsn":
 		clickhouse.DSN = value
 	case "output.clickhouse.table":
 		clickhouse.Table = value
 	case "output.clickhouse.batch_size":
 		return setInt(&clickhouse.BatchSize)
 	case "output.clickhouse.flush_interval_ms":
 		return setInt(&clickhouse.FlushIntervalMs)
 	case "output.clickhouse.max_buffer_size":
 		return setInt(&clickhouse.MaxBufferSize)
 	case "output.clickhouse.drop_on_overflow":
 		return setBool(&clickhouse.DropOnOverflow)
 	case "output.clickhouse.async_insert":
 		return setBool(&clickhouse.AsyncInsert)
 	case "output.clickhouse.timeout_ms":
 		return setInt(&clickhouse.TimeoutMs)
 	case "output.stdout.enabled":
 		return setBool(&cfg.Outputs.Stdout.Enabled)
 	case "correlation.key":
 		// Comma-separated list; surrounding blanks of each item are dropped.
 		keys := strings.Split(value, ",")
 		for i := range keys {
 			keys[i] = strings.TrimSpace(keys[i])
 		}
 		cfg.Correlation.Key = keys
 	case "correlation.time_window.value":
 		return setInt(&cfg.Correlation.TimeWindow.Value)
 	case "correlation.time_window.unit":
 		cfg.Correlation.TimeWindow.Unit = value
 	case "correlation.orphan_policy.apache_always_emit":
 		return setBool(&orphans.ApacheAlwaysEmit)
 	case "correlation.orphan_policy.network_emit":
 		return setBool(&orphans.NetworkEmit)
 	default:
 		return fmt.Errorf("unknown directive: %s", directive)
 	}
 	return nil
 }
 // parseBool converts a case-insensitive boolean word to a bool.
 // Accepted as true: "true", "yes", "1", "on".
 // Accepted as false: "false", "no", "0", "off".
 // Anything else yields an error that quotes the lower-cased input.
 func parseBool(s string) (bool, error) {
 	known := map[string]bool{
 		"true": true, "yes": true, "1": true, "on": true,
 		"false": false, "no": false, "0": false, "off": false,
 	}
 	normalized := strings.ToLower(s)
 	if parsed, found := known[normalized]; found {
 		return parsed, nil
 	}
 	return false, fmt.Errorf("invalid boolean value: %s", normalized)
 }
 // Validate checks cross-field constraints and returns the first violation:
 // fewer than two unix socket inputs, no output enabled, or ClickHouse enabled
 // without a DSN. It returns nil when all checks pass.
 func (c *Config) Validate() error {
 	outputs := &c.Outputs
 	anyOutput := outputs.File.Enabled || outputs.ClickHouse.Enabled || outputs.Stdout.Enabled
 	switch {
 	case len(c.Inputs.UnixSockets) < 2:
 		return fmt.Errorf("at least two unix socket inputs are required")
 	case !anyOutput:
 		return fmt.Errorf("at least one output must be enabled")
 	case outputs.ClickHouse.Enabled && outputs.ClickHouse.DSN == "":
 		return fmt.Errorf("clickhouse DSN is required when enabled")
 	}
 	return nil
 }
 // GetTimeWindow converts the configured value/unit pair to a time.Duration.
 // A value <= 0 counts as 1. Units "ms"/"millisecond"/"milliseconds" and
 // "m"/"minute"/"minutes" are honoured; every other unit, including the empty
 // string, is interpreted as seconds.
 func (c *CorrelationConfig) GetTimeWindow() time.Duration {
 	count := c.TimeWindow.Value
 	if count <= 0 {
 		count = 1
 	}
 	// Seconds is both the explicit "s" case and the fallback.
 	scale := time.Second
 	switch c.TimeWindow.Unit {
 	case "ms", "millisecond", "milliseconds":
 		scale = time.Millisecond
 	case "m", "minute", "minutes":
 		scale = time.Minute
 	}
 	return time.Duration(count) * scale
 }
--- a/internal/config/config_test.go
+++ b/internal/config/config_test.go
@ -0,0 +1,224 @@
 package config
 import (
 	"os"
 	"path/filepath"
 	"testing"
 	"time"
 )
 // TestLoad_ValidConfig loads a complete, valid directive file and spot-checks
 // the parsed service name, the number of inputs and the file output flag.
 func TestLoad_ValidConfig(t *testing.T) {
 	content := `
 # Test configuration
 service.name logcorrelator
 service.language go
 input.unix_socket apache_source /var/run/logcorrelator/apache.sock json
 input.unix_socket network_source /var/run/logcorrelator/network.sock json
 output.file.enabled true
 output.file.path /var/log/logcorrelator/correlated.log
 output.clickhouse.enabled false
 output.clickhouse.dsn clickhouse://user:pass@localhost:9000/db
 output.clickhouse.table correlated_logs
 correlation.key src_ip,src_port
 correlation.time_window.value 1
 correlation.time_window.unit s
 correlation.orphan_policy.apache_always_emit true
 correlation.orphan_policy.network_emit false
 `
 	configPath := filepath.Join(t.TempDir(), "config.conf")
 	if writeErr := os.WriteFile(configPath, []byte(content), 0644); writeErr != nil {
 		t.Fatalf("failed to write config: %v", writeErr)
 	}
 	cfg, err := Load(configPath)
 	if err != nil {
 		t.Fatalf("unexpected error: %v", err)
 	}
 	if got := cfg.Service.Name; got != "logcorrelator" {
 		t.Errorf("expected service name logcorrelator, got %s", got)
 	}
 	if got := len(cfg.Inputs.UnixSockets); got != 2 {
 		t.Errorf("expected 2 unix sockets, got %d", got)
 	}
 	if !cfg.Outputs.File.Enabled {
 		t.Error("expected file output enabled")
 	}
 }
 // TestLoad_InvalidPath checks that Load fails for a file that does not exist.
 func TestLoad_InvalidPath(t *testing.T) {
 	if _, err := Load("/nonexistent/path/config.conf"); err == nil {
 		t.Error("expected error for nonexistent path")
 	}
 }
 // TestLoad_InvalidDirective checks that Load rejects a file containing an
 // unknown directive.
 func TestLoad_InvalidDirective(t *testing.T) {
 	configPath := filepath.Join(t.TempDir(), "config.conf")
 	content := `invalid.directive value`
 	if writeErr := os.WriteFile(configPath, []byte(content), 0644); writeErr != nil {
 		t.Fatalf("failed to write config: %v", writeErr)
 	}
 	if _, err := Load(configPath); err == nil {
 		t.Error("expected error for invalid directive")
 	}
 }
 // TestLoad_Comments checks that comment lines interleaved with directives are
 // skipped and the remaining directives are still applied.
 func TestLoad_Comments(t *testing.T) {
 	configPath := filepath.Join(t.TempDir(), "config.conf")
 	content := `
 # This is a comment
 service.name logcorrelator
 # Another comment
 input.unix_socket test /tmp/test.sock json
 input.unix_socket test2 /tmp/test2.sock json
 output.file.enabled true
 `
 	if writeErr := os.WriteFile(configPath, []byte(content), 0644); writeErr != nil {
 		t.Fatalf("failed to write config: %v", writeErr)
 	}
 	cfg, err := Load(configPath)
 	if err != nil {
 		t.Fatalf("unexpected error: %v", err)
 	}
 	if got := cfg.Service.Name; got != "logcorrelator" {
 		t.Errorf("expected service name logcorrelator, got %s", got)
 	}
 }
 // TestValidate_MinimumInputs checks that a configuration with a single unix
 // socket input is rejected.
 func TestValidate_MinimumInputs(t *testing.T) {
 	var cfg Config
 	cfg.Inputs.UnixSockets = []UnixSocketConfig{
 		{Name: "only_one", Path: "/tmp/test.sock"},
 	}
 	cfg.Outputs.File.Enabled = true
 	if err := cfg.Validate(); err == nil {
 		t.Error("expected error for less than 2 inputs")
 	}
 }
 // TestValidate_AtLeastOneOutput checks that a configuration with enough
 // inputs but every output disabled is rejected.
 func TestValidate_AtLeastOneOutput(t *testing.T) {
 	var cfg Config
 	cfg.Inputs.UnixSockets = []UnixSocketConfig{
 		{Name: "a", Path: "/tmp/a.sock"},
 		{Name: "b", Path: "/tmp/b.sock"},
 	}
 	// Spell out that all three outputs are off.
 	cfg.Outputs.File.Enabled = false
 	cfg.Outputs.ClickHouse.Enabled = false
 	cfg.Outputs.Stdout.Enabled = false
 	if err := cfg.Validate(); err == nil {
 		t.Error("expected error for no outputs enabled")
 	}
 }
 // TestGetTimeWindow checks the duration computed for seconds, milliseconds,
 // minutes and for an entirely unset time window.
 func TestGetTimeWindow(t *testing.T) {
 	// window builds a CorrelationConfig carrying only the time window.
 	window := func(value int, unit string) CorrelationConfig {
 		return CorrelationConfig{TimeWindow: TimeWindowConfig{Value: value, Unit: unit}}
 	}
 	cases := []struct {
 		name string
 		cfg  CorrelationConfig
 		want time.Duration
 	}{
 		{name: "seconds", cfg: window(1, "s"), want: time.Second},
 		{name: "milliseconds", cfg: window(500, "ms"), want: 500 * time.Millisecond},
 		{name: "minutes", cfg: window(2, "m"), want: 2 * time.Minute},
 		{name: "default", cfg: CorrelationConfig{TimeWindow: TimeWindowConfig{}}, want: time.Second},
 	}
 	for _, tc := range cases {
 		t.Run(tc.name, func(t *testing.T) {
 			if got := tc.cfg.GetTimeWindow(); got != tc.want {
 				t.Errorf("expected %v, got %v", tc.want, got)
 			}
 		})
 	}
 }
 // TestParseBool checks the accepted spellings of true and false in several
 // letter cases, and that an unknown word is rejected.
 func TestParseBool(t *testing.T) {
 	cases := []struct {
 		input   string
 		want    bool
 		wantErr bool
 	}{
 		{input: "true", want: true},
 		{input: "True", want: true},
 		{input: "TRUE", want: true},
 		{input: "yes", want: true},
 		{input: "1", want: true},
 		{input: "on", want: true},
 		{input: "false", want: false},
 		{input: "False", want: false},
 		{input: "no", want: false},
 		{input: "0", want: false},
 		{input: "off", want: false},
 		{input: "invalid", wantErr: true},
 	}
 	for _, tc := range cases {
 		t.Run(tc.input, func(t *testing.T) {
 			got, err := parseBool(tc.input)
 			if tc.wantErr {
 				if err == nil {
 					t.Error("expected error, got nil")
 				}
 				return
 			}
 			if err != nil {
 				t.Errorf("unexpected error: %v", err)
 			}
 			if got != tc.want {
 				t.Errorf("expected %v, got %v", tc.want, got)
 			}
 		})
 	}
 }
--- a/internal/domain/correlated_log.go
+++ b/internal/domain/correlated_log.go
@ -0,0 +1,90 @@
 package domain
 import "time"
 // CorrelatedLog represents the output correlated log entry.
 //
 // It is produced either from a single unmatched event (Correlated == false,
 // OrphanSide set by the caller) or from a matched Apache/network pair
 // (Correlated == true, OrphanSide empty). The struct tags define the JSON
 // field names; fields tagged omitempty are left out when they hold their
 // zero value.
 type CorrelatedLog struct {
 	// Timestamp is the event timestamp; for a matched pair the constructor
 	// uses the later of the two event timestamps.
 	Timestamp    time.Time        `json:"timestamp"`
 	SrcIP        string           `json:"src_ip"`
 	SrcPort      int              `json:"src_port"`
 	DstIP        string           `json:"dst_ip,omitempty"`
 	DstPort      int              `json:"dst_port,omitempty"`
 	// Correlated is true only for entries built from two matched events.
 	Correlated   bool             `json:"correlated"`
 	// OrphanSide names the side an unmatched entry came from (callers in
 	// this package pass "A" or "B"); empty for correlated entries.
 	OrphanSide   string           `json:"orphan_side,omitempty"`
 	// Apache and Network carry a copy of the Raw map of the source A and
 	// source B event respectively; nil when that side is absent.
 	Apache       map[string]any   `json:"apache,omitempty"`
 	Network      map[string]any   `json:"network,omitempty"`
 	// Extra is initialised to an empty map by the constructors in this file.
 	Extra        map[string]any   `json:"extra,omitempty"`
 }
 // NewCorrelatedLogFromEvent wraps a single unmatched event as an uncorrelated
 // log entry. orphanSide is stored verbatim in OrphanSide. Only the payload
 // section matching the event's Source is populated; the other stays nil.
 func NewCorrelatedLogFromEvent(event *NormalizedEvent, orphanSide string) CorrelatedLog {
 	var entry CorrelatedLog
 	// Addressing and timing are copied straight from the event.
 	entry.Timestamp = event.Timestamp
 	entry.SrcIP, entry.SrcPort = event.SrcIP, event.SrcPort
 	entry.DstIP, entry.DstPort = event.DstIP, event.DstPort
 	// Correlated keeps its zero value (false): this entry has no partner.
 	entry.OrphanSide = orphanSide
 	entry.Apache = extractApache(event)
 	entry.Network = extractNetwork(event)
 	entry.Extra = map[string]any{}
 	return entry
 }
 // NewCorrelatedLog merges a matched Apache (source A) event and network
 // (source B) event into one correlated entry. The entry takes the later of
 // the two timestamps, the source address from the Apache event, and the
 // destination from the Apache event with the network event as fallback.
 func NewCorrelatedLog(apacheEvent, networkEvent *NormalizedEvent) CorrelatedLog {
 	// Start from the network timestamp and fall back to the Apache one
 	// unless the network event is strictly later.
 	latest := networkEvent.Timestamp
 	if !latest.After(apacheEvent.Timestamp) {
 		latest = apacheEvent.Timestamp
 	}
 	var entry CorrelatedLog
 	entry.Timestamp = latest
 	entry.SrcIP, entry.SrcPort = apacheEvent.SrcIP, apacheEvent.SrcPort
 	entry.DstIP = coalesceString(apacheEvent.DstIP, networkEvent.DstIP)
 	entry.DstPort = coalesceInt(apacheEvent.DstPort, networkEvent.DstPort)
 	entry.Correlated = true
 	entry.OrphanSide = ""
 	entry.Apache = extractApache(apacheEvent)
 	entry.Network = extractNetwork(networkEvent)
 	entry.Extra = map[string]any{}
 	return entry
 }
 // extractApache returns a shallow copy of the event's Raw map when the event
 // comes from source A, and nil for any other source.
 func extractApache(e *NormalizedEvent) map[string]any {
 	if e.Source == SourceA {
 		fields := make(map[string]any, len(e.Raw))
 		for name, value := range e.Raw {
 			fields[name] = value
 		}
 		return fields
 	}
 	return nil
 }
 // extractNetwork returns a shallow copy of the event's Raw map when the event
 // comes from source B, and nil for any other source.
 func extractNetwork(e *NormalizedEvent) map[string]any {
 	if e.Source == SourceB {
 		fields := make(map[string]any, len(e.Raw))
 		for name, value := range e.Raw {
 			fields[name] = value
 		}
 		return fields
 	}
 	return nil
 }
 // coalesceString returns a unless it is empty, in which case it returns b.
 func coalesceString(a, b string) string {
 	if a == "" {
 		return b
 	}
 	return a
 }
 // coalesceInt returns a unless it is zero, in which case it returns b.
 func coalesceInt(a, b int) int {
 	if a == 0 {
 		return b
 	}
 	return a
 }
--- a/internal/domain/correlated_log_test.go
+++ b/internal/domain/correlated_log_test.go
@ -0,0 +1,115 @@
 package domain
 import (
 	"testing"
 	"time"
 )
 // TestNormalizedEvent_CorrelationKeyFull checks that the correlation key is
 // rendered as "<src_ip>:<src_port>", including for port zero.
 func TestNormalizedEvent_CorrelationKeyFull(t *testing.T) {
 	cases := []struct {
 		name     string
 		event    *NormalizedEvent
 		expected string
 	}{
 		{name: "basic key", event: &NormalizedEvent{SrcIP: "192.168.1.1", SrcPort: 8080}, expected: "192.168.1.1:8080"},
 		{name: "different port", event: &NormalizedEvent{SrcIP: "10.0.0.1", SrcPort: 443}, expected: "10.0.0.1:443"},
 		{name: "port zero", event: &NormalizedEvent{SrcIP: "127.0.0.1", SrcPort: 0}, expected: "127.0.0.1:0"},
 	}
 	for _, tc := range cases {
 		t.Run(tc.name, func(t *testing.T) {
 			if got := tc.event.CorrelationKeyFull(); got != tc.expected {
 				t.Errorf("expected %s, got %s", tc.expected, got)
 			}
 		})
 	}
 }
 func TestNewCorrelatedLogFromEvent(t *testing.T) {
 	event := &NormalizedEvent{
 		Source:    SourceA,
 		Timestamp: time.Date(2024, 1, 1, 12, 0, 0, 0, time.UTC),
 		SrcIP:     "192.168.1.1",
 		SrcPort:   8080,
 		DstIP:     "10.0.0.1",
 		DstPort:   80,
 		Raw: map[string]any{
 			"method": "GET",
 			"path":   "/api/test",
 		},
 	}
 	log := NewCorrelatedLogFromEvent(event, "A")
 	if log.Correlated {
 		t.Error("expected correlated to be false")
 	}
 	if log.OrphanSide != "A" {
 		t.Errorf("expected orphan_side A, got %s", log.OrphanSide)
 	}
 	if log.SrcIP != "192.168.1.1" {
 		t.Errorf("expected src_ip 192.168.1.1, got %s", log.SrcIP)
 	}
 	if log.Apache == nil {
 		t.Error("expected apache to be non-nil")
 	}
 }
 // TestNewCorrelatedLog merges a source A and a source B event and checks that
 // the result is flagged as correlated with both payload sections present.
 func TestNewCorrelatedLog(t *testing.T) {
 	base := time.Date(2024, 1, 1, 12, 0, 0, 0, time.UTC)
 	httpSide := &NormalizedEvent{
 		Source:    SourceA,
 		Timestamp: base,
 		SrcIP:     "192.168.1.1",
 		SrcPort:   8080,
 		DstIP:     "10.0.0.1",
 		DstPort:   80,
 		Raw:       map[string]any{"method": "GET"},
 	}
 	netSide := &NormalizedEvent{
 		Source:    SourceB,
 		Timestamp: time.Date(2024, 1, 1, 12, 0, 0, 500000000, time.UTC),
 		SrcIP:     "192.168.1.1",
 		SrcPort:   8080,
 		DstIP:     "10.0.0.1",
 		DstPort:   80,
 		Raw:       map[string]any{"ja3": "abc123"},
 	}
 	entry := NewCorrelatedLog(httpSide, netSide)
 	if !entry.Correlated {
 		t.Error("expected correlated to be true")
 	}
 	if side := entry.OrphanSide; side != "" {
 		t.Errorf("expected orphan_side to be empty, got %s", side)
 	}
 	if entry.Apache == nil {
 		t.Error("expected apache to be non-nil")
 	}
 	if entry.Network == nil {
 		t.Error("expected network to be non-nil")
 	}
 }
--- a/internal/domain/correlation_service.go
+++ b/internal/domain/correlation_service.go
@ -0,0 +1,243 @@
 package domain
 import (
 	"container/list"
 	"sync"
 	"time"
 )
 const (
 	// DefaultMaxBufferSize is the default maximum number of events per buffer.
 	// NewCorrelationService applies it when CorrelationConfig.MaxBufferSize
 	// is zero or negative.
 	DefaultMaxBufferSize = 10000
 )
 // CorrelationConfig holds the correlation configuration.
 type CorrelationConfig struct {
 	// TimeWindow is the maximum absolute timestamp difference for two events
 	// to match; it is also the age after which buffered events are expired.
 	TimeWindow       time.Duration
 	// ApacheAlwaysEmit makes unmatched source A events be emitted as orphans
 	// (on arrival and again on Flush for those still buffered).
 	ApacheAlwaysEmit bool
 	// NetworkEmit makes unmatched source B events be emitted as orphans on
 	// arrival.
 	NetworkEmit      bool
 	MaxBufferSize    int // Maximum events to buffer per source
 }
 // CorrelationService handles the correlation logic between source A and B events.
 //
 // The exported methods in this file (ProcessEvent, Flush, GetBufferSizes)
 // take mu before touching the buffers or the pending maps.
 type CorrelationService struct {
 	config       CorrelationConfig
 	// mu guards the buffers and pending maps below.
 	mu           sync.Mutex
 	// bufferA/bufferB hold unmatched events per source in arrival order.
 	bufferA      *eventBuffer
 	bufferB      *eventBuffer
 	// pendingA/pendingB index the most recently buffered event for each
 	// correlation key; an older event with the same key stays in the
 	// buffer but is no longer reachable through the map.
 	pendingA     map[string]*list.Element // key -> list element containing NormalizedEvent
 	pendingB     map[string]*list.Element
 	// timeProvider supplies "now" for expiry, so tests can inject a clock.
 	timeProvider TimeProvider
 }
 // eventBuffer is a thin wrapper around a linked list of *NormalizedEvent
 // values; the service appends at the back and expires from the front.
 type eventBuffer struct {
 	events *list.List
 }
 // newEventBuffer returns an eventBuffer backed by a fresh, empty list.
 func newEventBuffer() *eventBuffer {
 	buf := new(eventBuffer)
 	buf.events = list.New()
 	return buf
 }
 // TimeProvider abstracts time for testability.
 // The correlation service calls Now when computing the expiry cutoff for
 // buffered events.
 type TimeProvider interface {
 	// Now returns the current time as seen by the provider.
 	Now() time.Time
 }
 // RealTimeProvider uses real system time.
 type RealTimeProvider struct{}
 func (p *RealTimeProvider) Now() time.Time {
 	return time.Now()
 }
 // NewCorrelationService builds a CorrelationService with empty buffers.
 // A nil timeProvider is replaced by RealTimeProvider, and a non-positive
 // MaxBufferSize is replaced by DefaultMaxBufferSize.
 func NewCorrelationService(config CorrelationConfig, timeProvider TimeProvider) *CorrelationService {
 	if config.MaxBufferSize <= 0 {
 		config.MaxBufferSize = DefaultMaxBufferSize
 	}
 	svc := &CorrelationService{
 		config:       config,
 		bufferA:      newEventBuffer(),
 		bufferB:      newEventBuffer(),
 		pendingA:     map[string]*list.Element{},
 		pendingB:     map[string]*list.Element{},
 		timeProvider: timeProvider,
 	}
 	if svc.timeProvider == nil {
 		svc.timeProvider = &RealTimeProvider{}
 	}
 	return svc
 }
 // ProcessEvent ingests one event and returns the log entries it produces.
 //
 // All work happens under the service mutex:
 //  1. buffered events older than the time window are expired;
 //  2. if the buffer for the event's source is full the event is dropped
 //     (a source A event is still emitted as an orphan when ApacheAlwaysEmit
 //     is set);
 //  3. the event is matched against the opposite source's pending events;
 //  4. the event is buffered only if it was NOT consumed by a match.
 //
 // Step 4 matters: a matched event's partner has already been removed from
 // its buffer, so buffering the matched event as well would let it correlate
 // a second time or be re-emitted as an orphan by Flush.
 //
 // Orphans emitted on arrival are still buffered, so with ApacheAlwaysEmit a
 // source A event may later also appear in a correlated entry or in Flush
 // output.
 //
 // A nil event is ignored and yields nil.
 func (s *CorrelationService) ProcessEvent(event *NormalizedEvent) []CorrelatedLog {
 	if event == nil {
 		return nil
 	}
 	s.mu.Lock()
 	defer s.mu.Unlock()
 	// Clean expired events first
 	s.cleanExpired()
 	// Check buffer overflow before adding
 	if s.isBufferFull(event.Source) {
 		// Buffer full, drop event or emit as orphan
 		if event.Source == SourceA && s.config.ApacheAlwaysEmit {
 			return []CorrelatedLog{NewCorrelatedLogFromEvent(event, "A")}
 		}
 		return nil
 	}
 	var results []CorrelatedLog
 	switch event.Source {
 	case SourceA:
 		results = s.processSourceA(event)
 	case SourceB:
 		results = s.processSourceB(event)
 	}
 	// A correlated result means this event was paired and its partner was
 	// removed from the opposite buffer; do not keep the event around.
 	for i := range results {
 		if results[i].Correlated {
 			return results
 		}
 	}
 	// Unmatched: keep the event so a later event from the other source can
 	// still pair with it.
 	s.addEvent(event)
 	return results
 }
 // isBufferFull reports whether the buffer for the given source has reached
 // MaxBufferSize. Sources other than A and B are never considered full.
 func (s *CorrelationService) isBufferFull(source EventSource) bool {
 	var target *eventBuffer
 	switch source {
 	case SourceA:
 		target = s.bufferA
 	case SourceB:
 		target = s.bufferB
 	default:
 		return false
 	}
 	return target.events.Len() >= s.config.MaxBufferSize
 }
 // processSourceA tries to pair a source A event with the pending source B
 // event that shares its correlation key. On a match within the time window
 // the B event is removed from its buffer and one correlated entry is
 // returned. Otherwise the A event is returned as an orphan when
 // ApacheAlwaysEmit is set, or nil is returned.
 func (s *CorrelationService) processSourceA(event *NormalizedEvent) []CorrelatedLog {
 	key := event.CorrelationKeyFull()
 	if candidate, found := s.pendingB[key]; found {
 		if partner := candidate.Value.(*NormalizedEvent); s.eventsMatch(event, partner) {
 			merged := NewCorrelatedLog(event, partner)
 			// The partner is consumed by this match.
 			s.bufferB.events.Remove(candidate)
 			delete(s.pendingB, key)
 			return []CorrelatedLog{merged}
 		}
 	}
 	if !s.config.ApacheAlwaysEmit {
 		// Nothing to emit now; the caller decides whether to buffer.
 		return nil
 	}
 	return []CorrelatedLog{NewCorrelatedLogFromEvent(event, "A")}
 }
 // processSourceB tries to pair a source B event with the pending source A
 // event that shares its correlation key. On a match within the time window
 // the A event is removed from its buffer and one correlated entry is
 // returned. Otherwise the B event is returned as an orphan only when
 // NetworkEmit is set; with NetworkEmit unset nil is returned.
 func (s *CorrelationService) processSourceB(event *NormalizedEvent) []CorrelatedLog {
 	key := event.CorrelationKeyFull()
 	if candidate, found := s.pendingA[key]; found {
 		if partner := candidate.Value.(*NormalizedEvent); s.eventsMatch(partner, event) {
 			merged := NewCorrelatedLog(partner, event)
 			// The partner is consumed by this match.
 			s.bufferA.events.Remove(candidate)
 			delete(s.pendingA, key)
 			return []CorrelatedLog{merged}
 		}
 	}
 	if !s.config.NetworkEmit {
 		// Nothing to emit now; the caller decides whether to buffer.
 		return nil
 	}
 	return []CorrelatedLog{NewCorrelatedLogFromEvent(event, "B")}
 }
 // eventsMatch reports whether the two events' timestamps differ by at most
 // the configured TimeWindow, in either direction.
 //
 // Duration.Abs is used instead of a manual negation: Time.Sub saturates at
 // the minimum Duration for very distant timestamps (for example a zero
 // Timestamp compared with a current one), and negating that minimum
 // overflows and stays negative, which would wrongly count as a match.
 // Abs maps the minimum Duration to the maximum one.
 func (s *CorrelationService) eventsMatch(a, b *NormalizedEvent) bool {
 	gap := a.Timestamp.Sub(b.Timestamp).Abs()
 	return gap <= s.config.TimeWindow
 }
 // addEvent appends the event to the buffer for its source and records the
 // new list element in the matching pending map under the event's
 // correlation key, replacing any earlier entry for that key. Events from
 // any other source are ignored.
 func (s *CorrelationService) addEvent(event *NormalizedEvent) {
 	key := event.CorrelationKeyFull()
 	if event.Source == SourceA {
 		s.pendingA[key] = s.bufferA.events.PushBack(event)
 		return
 	}
 	if event.Source == SourceB {
 		s.pendingB[key] = s.bufferB.events.PushBack(event)
 	}
 }
 // cleanExpired drops, from both buffers, events whose timestamp is older
 // than the provider's current time minus TimeWindow.
 func (s *CorrelationService) cleanExpired() {
 	cutoff := s.timeProvider.Now().Add(-s.config.TimeWindow)
 	// Same expiry rule for both sides.
 	s.cleanBuffer(s.bufferA, s.pendingA, cutoff)
 	s.cleanBuffer(s.bufferB, s.pendingB, cutoff)
 }
 // cleanBuffer pops events off the front of the buffer while their timestamp
 // is before cutoff, and stops at the first event that is not expired. A
 // pending-map entry is deleted only when it still points at the element
 // being removed, so a newer event with the same key keeps its entry.
 func (s *CorrelationService) cleanBuffer(buffer *eventBuffer, pending map[string]*list.Element, cutoff time.Time) {
 	for {
 		front := buffer.events.Front()
 		if front == nil {
 			return
 		}
 		oldest := front.Value.(*NormalizedEvent)
 		if !oldest.Timestamp.Before(cutoff) {
 			// The scan relies on buffer order and ends at the first
 			// non-expired event.
 			return
 		}
 		buffer.events.Remove(front)
 		key := oldest.CorrelationKeyFull()
 		if pending[key] == front {
 			delete(pending, key)
 		}
 	}
 }
 // Flush empties both buffers and both pending maps (intended for shutdown).
 // When ApacheAlwaysEmit is set, every source A event still buffered is
 // returned as an orphan entry in buffer order; source B events are
 // discarded without being emitted. Returns nil when nothing is emitted.
 func (s *CorrelationService) Flush() []CorrelatedLog {
 	s.mu.Lock()
 	defer s.mu.Unlock()
 	var orphans []CorrelatedLog
 	if s.config.ApacheAlwaysEmit {
 		elem := s.bufferA.events.Front()
 		for elem != nil {
 			pending := elem.Value.(*NormalizedEvent)
 			orphans = append(orphans, NewCorrelatedLogFromEvent(pending, "A"))
 			elem = elem.Next()
 		}
 	}
 	// Reset all state so the service starts empty afterwards.
 	s.bufferA.events.Init()
 	s.bufferB.events.Init()
 	s.pendingA = map[string]*list.Element{}
 	s.pendingB = map[string]*list.Element{}
 	return orphans
 }
 // GetBufferSizes returns the number of events currently buffered for
 // source A and source B, in that order (for monitoring).
 func (s *CorrelationService) GetBufferSizes() (int, int) {
 	s.mu.Lock()
 	defer s.mu.Unlock()
 	sizeA := s.bufferA.events.Len()
 	sizeB := s.bufferB.events.Len()
 	return sizeA, sizeB
 }
--- a/internal/domain/correlation_service_test.go
+++ b/internal/domain/correlation_service_test.go
@ -0,0 +1,153 @@
 package domain
 import (
 	"testing"
 	"time"
 )
 type mockTimeProvider struct {
 	now time.Time
 }
 func (m *mockTimeProvider) Now() time.Time {
 	return m.now
 }
 func TestCorrelationService_Match(t *testing.T) {
 	now := time.Date(2024, 1, 1, 12, 0, 0, 0, time.UTC)
 	timeProvider := &mockTimeProvider{now: now}
 	config := CorrelationConfig{
 		TimeWindow:       time.Second,
 		ApacheAlwaysEmit: false, // Don't emit A immediately to test matching
 		NetworkEmit:      false,
 	}
 	svc := NewCorrelationService(config, timeProvider)
 	// Send Apache event (should be buffered, not emitted)
 	apacheEvent := &NormalizedEvent{
 		Source:    SourceA,
 		Timestamp: now,
 		SrcIP:     "192.168.1.1",
 		SrcPort:   8080,
 		Raw:       map[string]any{"method": "GET"},
 	}
 	results := svc.ProcessEvent(apacheEvent)
 	if len(results) != 0 {
 		t.Fatalf("expected 0 results (buffered), got %d", len(results))
 	}
 	// Send matching Network event within window
 	networkEvent := &NormalizedEvent{
 		Source:    SourceB,
 		Timestamp: now.Add(500 * time.Millisecond),
 		SrcIP:     "192.168.1.1",
 		SrcPort:   8080,
 		Raw:       map[string]any{"ja3": "abc"},
 	}
 	// This should match and return correlated log
 	results = svc.ProcessEvent(networkEvent)
 	if len(results) != 1 {
 		t.Errorf("expected 1 result (correlated), got %d", len(results))
 	} else if !results[0].Correlated {
 		t.Error("expected correlated result")
 	}
 }
 func TestCorrelationService_NoMatch_DifferentIP(t *testing.T) {
 	now := time.Date(2024, 1, 1, 12, 0, 0, 0, time.UTC)
 	timeProvider := &mockTimeProvider{now: now}
 	config := CorrelationConfig{
 		TimeWindow:       time.Second,
 		ApacheAlwaysEmit: true,
 		NetworkEmit:      false,
 	}
 	svc := NewCorrelationService(config, timeProvider)
 	apacheEvent := &NormalizedEvent{
 		Source:    SourceA,
 		Timestamp: now,
 		SrcIP:     "192.168.1.1",
 		SrcPort:   8080,
 	}
 	networkEvent := &NormalizedEvent{
 		Source:    SourceB,
 		Timestamp: now,
 		SrcIP:     "192.168.1.2", // Different IP
 		SrcPort:   8080,
 	}
 	svc.ProcessEvent(apacheEvent)
 	results := svc.ProcessEvent(networkEvent)
 	if len(results) != 0 {
 		t.Errorf("expected 0 results (different IP), got %d", len(results))
 	}
 }
 func TestCorrelationService_NoMatch_TimeWindowExceeded(t *testing.T) {
 	now := time.Date(2024, 1, 1, 12, 0, 0, 0, time.UTC)
 	timeProvider := &mockTimeProvider{now: now}
 	config := CorrelationConfig{
 		TimeWindow:       time.Second,
 		ApacheAlwaysEmit: true,
 		NetworkEmit:      false,
 	}
 	svc := NewCorrelationService(config, timeProvider)
 	apacheEvent := &NormalizedEvent{
 		Source:    SourceA,
 		Timestamp: now,
 		SrcIP:     "192.168.1.1",
 		SrcPort:   8080,
 	}
 	networkEvent := &NormalizedEvent{
 		Source:    SourceB,
 		Timestamp: now.Add(2 * time.Second), // Outside window
 		SrcIP:     "192.168.1.1",
 		SrcPort:   8080,
 	}
 	svc.ProcessEvent(apacheEvent)
 	results := svc.ProcessEvent(networkEvent)
 	if len(results) != 0 {
 		t.Errorf("expected 0 results (time window exceeded), got %d", len(results))
 	}
 }
 func TestCorrelationService_Flush(t *testing.T) {
 	now := time.Date(2024, 1, 1, 12, 0, 0, 0, time.UTC)
 	timeProvider := &mockTimeProvider{now: now}
 	config := CorrelationConfig{
 		TimeWindow:       time.Second,
 		ApacheAlwaysEmit: true,
 		NetworkEmit:      false,
 	}
 	svc := NewCorrelationService(config, timeProvider)
 	apacheEvent := &NormalizedEvent{
 		Source:    SourceA,
 		Timestamp: now,
 		SrcIP:     "192.168.1.1",
 		SrcPort:   8080,
 	}
 	svc.ProcessEvent(apacheEvent)
 	flushed := svc.Flush()
 	if len(flushed) != 1 {
 		t.Errorf("expected 1 flushed event, got %d", len(flushed))
 	}
 }
--- a/internal/domain/event.go
+++ b/internal/domain/event.go
@ -0,0 +1,37 @@
 package domain
 import (
 	"strconv"
 	"time"
 )
 // EventSource identifies the source of an event.
 // The two defined values are the string tags "A" and "B".
 type EventSource string
 const (
 	SourceA EventSource = "A" // Apache/HTTP source
 	SourceB EventSource = "B" // Network source
 )
 // NormalizedEvent represents a unified internal event from either source.
 type NormalizedEvent struct {
 	// Source tells which side (SourceA or SourceB) produced the event.
 	Source    EventSource
 	// Timestamp is compared against the partner event's timestamp and
 	// against the expiry cutoff by the correlation service.
 	Timestamp time.Time
 	// SrcIP and SrcPort together form the correlation key.
 	SrcIP     string
 	SrcPort   int
 	DstIP     string
 	DstPort   int
 	Headers   map[string]string
 	Extra     map[string]any
 	Raw       map[string]any // Original raw data
 }
 // CorrelationKey returns the key used for correlation: the source IP and the
 // decimal source port joined by a colon, e.g. "192.168.1.1:8080".
 func (e *NormalizedEvent) CorrelationKey() string {
 	key := append([]byte(e.SrcIP), ':')
 	key = strconv.AppendInt(key, int64(e.SrcPort), 10)
 	return string(key)
 }
 // CorrelationKeyFull is an alias for CorrelationKey and returns the same
 // "<src_ip>:<src_port>" string.
 func (e *NormalizedEvent) CorrelationKeyFull() string {
 	key := e.CorrelationKey()
 	return key
 }
--- a/internal/observability/logger.go
+++ b/internal/observability/logger.go
@ -0,0 +1,85 @@
 package observability
 import (
 	"log"
 	"os"
 	"sync"
 )
 // Logger provides structured logging.
 // It wraps a standard library *log.Logger and adds a name prefix, a level
 // tag and an optional set of fields appended to each message.
 type Logger struct {
 	// mu serialises the Info/Error/Debug calls made on this Logger value.
 	mu       sync.Mutex
 	// logger is the underlying writer; WithFields copies this pointer, so
 	// derived loggers share it.
 	logger   *log.Logger
 	// prefix is rendered as "[prefix] " in front of the level when non-empty.
 	prefix   string
 	// fields are appended to every message logged through this Logger.
 	fields   map[string]any
 }
 // NewLogger returns a Logger named prefix that writes to the os.Stderr in
 // effect at call time, with date, time and microsecond stamps and no fields.
 func NewLogger(prefix string) *Logger {
 	const stampFlags = log.LstdFlags | log.Lmicroseconds
 	created := new(Logger)
 	created.logger = log.New(os.Stderr, "", stampFlags)
 	created.prefix = prefix
 	created.fields = map[string]any{}
 	return created
 }
 // WithFields returns a new Logger that shares the receiver's underlying
 // writer and prefix and carries the receiver's fields plus the given ones.
 // On a key collision the value from fields wins. The receiver is not
 // modified.
 func (l *Logger) WithFields(fields map[string]any) *Logger {
 	merged := make(map[string]any, len(l.fields)+len(fields))
 	// Copy inherited fields first so the new ones can override them.
 	for name, value := range l.fields {
 		merged[name] = value
 	}
 	for name, value := range fields {
 		merged[name] = value
 	}
 	return &Logger{
 		logger: l.logger,
 		prefix: l.prefix,
 		fields: merged,
 	}
 }
 // Info writes msg at level INFO while holding the logger's mutex.
 func (l *Logger) Info(msg string) {
 	const level = "INFO"
 	l.mu.Lock()
 	defer l.mu.Unlock()
 	l.log(level, msg)
 }
 // Error writes msg at level ERROR while holding the logger's mutex. When err
 // is non-nil its text is appended to msg after a single space.
 func (l *Logger) Error(msg string, err error) {
 	const level = "ERROR"
 	l.mu.Lock()
 	defer l.mu.Unlock()
 	text := msg
 	if err != nil {
 		text = msg + " " + err.Error()
 	}
 	l.log(level, text)
 }
 // Debug writes msg at level DEBUG while holding the logger's mutex.
 func (l *Logger) Debug(msg string) {
 	const level = "DEBUG"
 	l.mu.Lock()
 	defer l.mu.Unlock()
 	l.log(level, msg)
 }
 // log writes one line of the form "[prefix] LEVEL <timestamp> msg", followed
 // by the logger's fields (formatted with %+v) when there are any.
 //
 // msg is always passed as a value, never as a format string, so a "%" in
 // the message is printed literally. The fields map is formatted as a single
 // argument, which keeps the output well-formed regardless of how many
 // fields are set.
 //
 // The line is emitted through a short-lived *log.Logger that reuses the
 // underlying writer and flags. Loggers derived with WithFields share the
 // same underlying *log.Logger but have their own mutex, so changing the
 // shared logger's prefix here could label another logger's line with the
 // wrong level.
 func (l *Logger) log(level, msg string) {
 	prefix := l.prefix
 	if prefix != "" {
 		prefix = "[" + prefix + "] "
 	}
 	out := log.New(l.logger.Writer(), prefix+level+" ", l.logger.Flags())
 	if len(l.fields) > 0 {
 		out.Printf("%s %+v", msg, l.fields)
 		return
 	}
 	out.Print(msg)
 }
--- a/internal/observability/logger_test.go
+++ b/internal/observability/logger_test.go
@ -0,0 +1,111 @@
 package observability
 import (
 	"bytes"
 	"io"
 	"os"
 	"strings"
 	"testing"
 )
 // TestNewLogger checks that NewLogger returns a non-nil logger that stores
 // the given prefix.
 func TestNewLogger(t *testing.T) {
 	const name = "test"
 	created := NewLogger(name)
 	if created == nil {
 		t.Fatal("expected non-nil logger")
 	}
 	if got := created.prefix; got != name {
 		t.Errorf("expected prefix 'test', got %s", got)
 	}
 }
 // TestLogger_Info redirects os.Stderr into a pipe, logs one INFO message and
 // checks that both the level and the message text reach the output.
 func TestLogger_Info(t *testing.T) {
 	// Swap stderr before constructing the logger, which captures it.
 	savedStderr := os.Stderr
 	reader, writer, _ := os.Pipe()
 	os.Stderr = writer
 	NewLogger("test").Info("test message")
 	writer.Close()
 	os.Stderr = savedStderr
 	captured := new(bytes.Buffer)
 	io.Copy(captured, reader)
 	got := captured.String()
 	checks := []struct{ substr, failure string }{
 		{"INFO", "expected INFO in output"},
 		{"test message", "expected 'test message' in output"},
 	}
 	for _, check := range checks {
 		if !strings.Contains(got, check.substr) {
 			t.Error(check.failure)
 		}
 	}
 }
 // TestLogger_Error redirects os.Stderr into a pipe, logs one ERROR message
 // with a nil error and checks that the level and message reach the output.
 func TestLogger_Error(t *testing.T) {
 	// Swap stderr before constructing the logger, which captures it.
 	savedStderr := os.Stderr
 	reader, writer, _ := os.Pipe()
 	os.Stderr = writer
 	NewLogger("test").Error("error message", nil)
 	writer.Close()
 	os.Stderr = savedStderr
 	captured := new(bytes.Buffer)
 	io.Copy(captured, reader)
 	got := captured.String()
 	checks := []struct{ substr, failure string }{
 		{"ERROR", "expected ERROR in output"},
 		{"error message", "expected 'error message' in output"},
 	}
 	for _, check := range checks {
 		if !strings.Contains(got, check.substr) {
 			t.Error(check.failure)
 		}
 	}
 }
 // TestLogger_Debug redirects os.Stderr into a pipe, logs one DEBUG message
 // and checks that both the level and the message text reach the output.
 func TestLogger_Debug(t *testing.T) {
 	// Swap stderr before constructing the logger, which captures it.
 	savedStderr := os.Stderr
 	reader, writer, _ := os.Pipe()
 	os.Stderr = writer
 	NewLogger("test").Debug("debug message")
 	writer.Close()
 	os.Stderr = savedStderr
 	captured := new(bytes.Buffer)
 	io.Copy(captured, reader)
 	got := captured.String()
 	checks := []struct{ substr, failure string }{
 		{"DEBUG", "expected DEBUG in output"},
 		{"debug message", "expected 'debug message' in output"},
 	}
 	for _, check := range checks {
 		if !strings.Contains(got, check.substr) {
 			t.Error(check.failure)
 		}
 	}
 }
 // TestLogger_WithFields checks that WithFields returns a distinct Logger
 // carrying exactly the two supplied fields.
 func TestLogger_WithFields(t *testing.T) {
 	parent := NewLogger("test")
 	extra := map[string]any{
 		"key1": "value1",
 		"key2": 42,
 	}
 	child := parent.WithFields(extra)
 	if child == parent {
 		t.Error("expected different logger instance")
 	}
 	if n := len(child.fields); n != 2 {
 		t.Errorf("expected 2 fields, got %d", n)
 	}
 }
 // TestLogger_Name checks that the name passed to NewLogger is kept as the
 // logger's prefix.
 func TestLogger_Name(t *testing.T) {
 	const name = "myservice"
 	if got := NewLogger(name).prefix; got != name {
 		t.Errorf("expected prefix 'myservice', got %s", got)
 	}
 }
--- a/internal/ports/source.go
+++ b/internal/ports/source.go
@ -0,0 +1,54 @@
 package ports
 import (
 	"context"
 	"time"
 	"github.com/logcorrelator/logcorrelator/internal/domain"
 )
 // EventSource defines the interface for log sources.
 // A source produces *domain.NormalizedEvent values on a channel supplied by
 // the caller.
 type EventSource interface {
 	// Start begins reading events and sending them to the channel.
 	// Returns an error if the source cannot be started.
 	// eventChan is send-only from the source's side.
 	// NOTE(review): whether Start blocks until ctx is cancelled or returns
 	// after launching a goroutine is not specified here; confirm against
 	// the implementations.
 	Start(ctx context.Context, eventChan chan<- *domain.NormalizedEvent) error
 	// Stop gracefully stops the source.
 	Stop() error
 	// Name returns the source name.
 	Name() string
 }
 // CorrelatedLogSink defines the interface for correlated log destinations.
 type CorrelatedLogSink interface {
 	// Write sends a correlated log to the sink.
 	// The log is passed by value.
 	Write(ctx context.Context, log domain.CorrelatedLog) error
 	// Flush flushes any buffered logs.
 	Flush(ctx context.Context) error
 	// Close closes the sink.
 	// NOTE(review): whether Close implies a Flush is not specified here;
 	// confirm against the implementations.
 	Close() error
 	// Name returns the sink name.
 	Name() string
 }
 // TimeProvider abstracts time for testability.
 // It has the same method set as domain.TimeProvider, so any value
 // satisfying one satisfies the other.
 type TimeProvider interface {
 	// Now returns the current time as seen by the provider.
 	Now() time.Time
 }
 // CorrelationProcessor defines the interface for the correlation service.
 // This allows for easier testing and alternative implementations.
 // The method set matches the exported methods of domain.CorrelationService.
 type CorrelationProcessor interface {
 	// ProcessEvent processes an incoming event and returns correlated logs.
 	// The result may be empty when the event produces no output.
 	ProcessEvent(event *domain.NormalizedEvent) []domain.CorrelatedLog
 	// Flush forces emission of remaining buffered events.
 	Flush() []domain.CorrelatedLog
 	// GetBufferSizes returns the current buffer sizes for monitoring.
 	// domain.CorrelationService returns the source A size first, then the
 	// source B size.
 	GetBufferSizes() (int, int)
 }
--- a/logcorrelator.service
+++ b/logcorrelator.service
@ -0,0 +1,23 @@
 [Unit]
 Description=logcorrelator service
 After=network.target
 [Service]
 Type=simple
 User=logcorrelator
 Group=logcorrelator
 ExecStart=/usr/bin/logcorrelator -config /etc/logcorrelator/logcorrelator.conf
 Restart=on-failure
 RestartSec=5
 # Runtime directory: systemd creates /run/logcorrelator (reachable as
 # /var/run/logcorrelator) owned by User/Group on every start and makes it
 # writable. Listing the path in ReadWritePaths instead requires it to already
 # exist, which is not the case after a reboot when /run is a tmpfs, and the
 # unit would then fail while setting up its mount namespace.
 RuntimeDirectory=logcorrelator
 # Security hardening
 NoNewPrivileges=true
 ProtectSystem=strict
 ProtectHome=true
 ReadWritePaths=/var/log/logcorrelator
 # Resource limits
 LimitNOFILE=65536
 [Install]
 WantedBy=multi-user.target
--- a/packaging/deb/postinst
+++ b/packaging/deb/postinst
@ -0,0 +1,66 @@
 #!/bin/bash
 set -e
 # postinst script for logcorrelator .deb package
 # $1 is the action passed by dpkg; only "configure" does real work.
 account=logcorrelator
 conf_file=/etc/logcorrelator/logcorrelator.conf
 case "$1" in
    configure)
        # Make sure the system group and user exist
        getent group "$account" > /dev/null 2>&1 || groupadd --system "$account"
        getent passwd "$account" > /dev/null 2>&1 || useradd --system \
            --gid "$account" \
            --home-dir /var/lib/logcorrelator \
            --no-create-home \
            --shell /usr/sbin/nologin \
            "$account"
        # Create the state, runtime, log and config directories
        for dir in /var/lib/logcorrelator /var/run/logcorrelator /var/log/logcorrelator /etc/logcorrelator; do
            mkdir -p "$dir"
        done
        # Hand all of them to the service account
        for dir in /var/lib/logcorrelator /var/run/logcorrelator /var/log/logcorrelator /etc/logcorrelator; do
            chown -R "$account:$account" "$dir"
        done
        # Restrict state, log and config directories to owner and group
        for dir in /var/lib/logcorrelator /var/log/logcorrelator /etc/logcorrelator; do
            chmod 750 "$dir"
        done
        # Seed the config from the shipped example, never overwriting an existing one
        if [ ! -f "$conf_file" ]; then
            cp /usr/share/logcorrelator/logcorrelator.conf.example "$conf_file"
            chown "$account:$account" "$conf_file"
            chmod 640 "$conf_file"
        fi
        # Enable and start the unit only when systemd is actually running
        # (skipped in containers and chroots)
        if [ -x /bin/systemctl ] && [ -d /run/systemd/system ]; then
            systemctl daemon-reload
            systemctl enable logcorrelator.service
            systemctl is-active --quiet logcorrelator.service || systemctl start logcorrelator.service
        fi
        ;;
    abort-upgrade|abort-remove|abort-deconfigure)
        # Nothing to undo on abort
        ;;
    *)
        echo "postinst called with unknown argument '$1'" >&2
        exit 1
        ;;
 esac
 exit 0
--- a/packaging/deb/postrm
+++ b/packaging/deb/postrm
@ -0,0 +1,52 @@
 #!/bin/bash
 set -e
 # postrm script for logcorrelator .deb package
 # dpkg calls postrm with: remove, purge, upgrade, failed-upgrade,
 # abort-install, abort-upgrade or disappear. Every one of these must be
 # accepted; exiting non-zero on "upgrade" would make package upgrades fail.
 case "$1" in
    remove)
        # On remove, leave config and data files
        ;;
    purge)
        # On purge, remove everything
        # Stop service if running
        if [ -x /bin/systemctl ] && [ -d /run/systemd/system ]; then
            systemctl stop logcorrelator.service 2>/dev/null || true
            systemctl disable logcorrelator.service 2>/dev/null || true
            systemctl daemon-reload
        fi
        # Remove configuration
        rm -rf /etc/logcorrelator
        # Remove data and logs
        rm -rf /var/lib/logcorrelator
        rm -rf /var/log/logcorrelator
        rm -rf /var/run/logcorrelator
        # Remove user and group
        if getent passwd logcorrelator > /dev/null 2>&1; then
            userdel logcorrelator 2>/dev/null || true
        fi
        if getent group logcorrelator > /dev/null 2>&1; then
            groupdel logcorrelator 2>/dev/null || true
        fi
        ;;
    upgrade|failed-upgrade|abort-install|disappear)
        # Nothing to clean up: files, config and the service account stay
        # in place for the version being installed.
        ;;
    abort-upgrade|abort-remove|abort-deconfigure)
        # On abort, restart the service
        if [ -x /bin/systemctl ] && [ -d /run/systemd/system ]; then
            systemctl start logcorrelator.service 2>/dev/null || true
        fi
        ;;
    *)
        echo "postrm called with unknown argument '$1'" >&2
        exit 1
        ;;
 esac
 exit 0
--- a/packaging/deb/prerm
+++ b/packaging/deb/prerm
@ -0,0 +1,29 @@
 #!/bin/bash
 set -e
 # prerm script for logcorrelator .deb package
 # dpkg calls prerm with: remove, upgrade, deconfigure or failed-upgrade.
 case "$1" in
    remove|deconfigure)
        # Stop and disable the service
        if [ -x /bin/systemctl ] && [ -d /run/systemd/system ]; then
            systemctl stop logcorrelator.service 2>/dev/null || true
            systemctl disable logcorrelator.service 2>/dev/null || true
            systemctl daemon-reload
        fi
        ;;
    upgrade|failed-upgrade)
        # On upgrade, just stop the service (will be restarted by postinst).
        # failed-upgrade is what dpkg passes to the new package's prerm when
        # the old package's "prerm upgrade" failed; treat it the same way so
        # the upgrade can proceed.
        if [ -x /bin/systemctl ] && [ -d /run/systemd/system ]; then
            systemctl stop logcorrelator.service 2>/dev/null || true
        fi
        ;;
    *)
        echo "prerm called with unknown argument '$1'" >&2
        exit 1
        ;;
 esac
 exit 0
--- a/test.sh
+++ b/test.sh
@ -0,0 +1,21 @@
 #!/bin/bash
 # Test script - builds the "builder" stage of the Dockerfile
 # NOTE(review): presumably the builder stage runs the test suite; confirm in the Dockerfile
 set -e
 # Run from the directory containing this script so the build context is the repo
 script_dir="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 cd "$script_dir"
 rule="=============================================="
 printf '%s\n' "$rule" "  logcorrelator - Test Suite (Docker)" "$rule" ""
 # Build only up to the builder stage and tag the result as the test image
 docker build --target builder -t logcorrelator-test:latest -f Dockerfile .
 printf '%s\n' "" "Tests completed successfully!" ""
		`@ -0,0 +1,3 @@`
							`module github.com/logcorrelator/logcorrelator`

							`go 1.21`