From 66b1209486838b12110ae4b2d42479f22c1b2717 Mon Sep 17 00:00:00 2001
From: Jordan Wages <jordan@jordanwages.com>
Date: Sat, 19 Jul 2025 04:08:40 -0500
Subject: [PATCH 01/26] Fix dropdown duration dirs

---
 scripts/generate_reports.py | 14 ++++++++------
 1 file changed, 8 insertions(+), 6 deletions(-)

diff --git a/scripts/generate_reports.py b/scripts/generate_reports.py
index 4c0c911..b9100f4 100644
--- a/scripts/generate_reports.py
+++ b/scripts/generate_reports.py
@@ -192,12 +192,14 @@ def _generate_all_domains(interval: str) -> None:
 def _generate_root_index() -> None:
     """Render the top-level index listing all intervals and domains."""
     _copy_icons()
-    intervals = [
-        p.name
-        for p in OUTPUT_DIR.iterdir()
-        if p.is_dir() and p.name.lower() not in {"domains", "global", "analysis"}
-    ]
-    intervals.sort()
+    intervals = sorted(
+        [
+            name
+            for name in INTERVAL_FORMATS
+            if (OUTPUT_DIR / name).is_dir()
+        ]
+    )
+
 
     domains_dir = OUTPUT_DIR / "domains"
     domains: List[str] = []

From 87608ccdb91023fb7bdbc2d3674524eae579af94 Mon Sep 17 00:00:00 2001
From: Jordan Wages <jordan@jordanwages.com>
Date: Sat, 19 Jul 2025 04:17:38 -0500
Subject: [PATCH 02/26] refactor: improve report field names

---
 reports.yml                 | 56 ++++++++++++++++++++++++-------------
 scripts/generate_reports.py |  8 ++++++
 templates/index.html        |  7 +++--
 3 files changed, 49 insertions(+), 22 deletions(-)

diff --git a/reports.yml b/reports.yml
index 1622538..c9b9cd3 100644
--- a/reports.yml
+++ b/reports.yml
@@ -2,30 +2,36 @@
   label: Hits
   icon: pulse
   chart: line
+  bucket: time_bucket
+  bucket_label: Time
   query: |
-    SELECT {bucket} AS bucket,
+    SELECT {bucket} AS time_bucket,
            COUNT(*) AS value
     FROM logs
-    GROUP BY bucket
-    ORDER BY bucket
+    GROUP BY time_bucket
+    ORDER BY time_bucket
 
 - name: error_rate
   label: Error Rate (%)
   icon: file-alert
   chart: line
+  bucket: time_bucket
+  bucket_label: Time
   query: |
-    SELECT {bucket} AS bucket,
+    SELECT {bucket} AS time_bucket,
            SUM(CASE WHEN status BETWEEN 400 AND 599 THEN 1 ELSE 0 END) * 100.0 / COUNT(*) AS value
     FROM logs
-    GROUP BY bucket
-    ORDER BY bucket
+    GROUP BY time_bucket
+    ORDER BY time_bucket
 
 - name: cache_status_breakdown
   label: Cache Status
   icon: archive
   chart: polarArea
+  bucket: cache_status
+  bucket_label: Cache Status
   query: |
-    SELECT cache_status AS bucket,
+    SELECT cache_status AS cache_status,
            COUNT(*) AS value
     FROM logs
     GROUP BY cache_status
@@ -43,30 +49,36 @@
   icon: globe
   chart: table
   per_domain: false
+  bucket: domain
+  bucket_label: Domain
   query: |
-    SELECT host AS bucket,
+    SELECT host AS domain,
            COUNT(*) AS value
     FROM logs
-    GROUP BY host
+    GROUP BY domain
     ORDER BY value DESC
 
 - name: bytes_sent
   label: Bytes Sent
   icon: upload
   chart: line
+  bucket: time_bucket
+  bucket_label: Time
   query: |
-    SELECT {bucket} AS bucket,
+    SELECT {bucket} AS time_bucket,
            SUM(bytes_sent) AS value
     FROM logs
-    GROUP BY bucket
-    ORDER BY bucket
+    GROUP BY time_bucket
+    ORDER BY time_bucket
 
 - name: top_paths
   label: Top Paths
   icon: map
   chart: table
+  bucket: path
+  bucket_label: Path
   query: |
-    SELECT path AS bucket,
+    SELECT path AS path,
            COUNT(*) AS value
     FROM (
         SELECT substr(substr(request, instr(request, ' ') + 1), 1,
@@ -81,8 +93,10 @@
   label: User Agents
   icon: user
   chart: table
+  bucket: user_agent
+  bucket_label: User Agent
   query: |
-    SELECT user_agent AS bucket,
+    SELECT user_agent AS user_agent,
            COUNT(*) AS value
     FROM logs
     GROUP BY user_agent
@@ -93,11 +107,13 @@
   label: Referrers
   icon: link
   chart: table
+  bucket: referrer
+  bucket_label: Referrer
   query: |
-    SELECT referer AS bucket,
+    SELECT referer AS referrer,
            COUNT(*) AS value
     FROM logs
-    GROUP BY referer
+    GROUP BY referrer
     ORDER BY value DESC
     LIMIT 20
 
@@ -105,17 +121,19 @@
   label: HTTP Statuses
   icon: server
   chart: pie
+  bucket: status_group
+  bucket_label: Status
   query: |
     SELECT CASE
              WHEN status BETWEEN 200 AND 299 THEN '2xx'
              WHEN status BETWEEN 300 AND 399 THEN '3xx'
              WHEN status BETWEEN 400 AND 499 THEN '4xx'
              ELSE '5xx'
-           END AS bucket,
+           END AS status_group,
            COUNT(*) AS value
     FROM logs
-    GROUP BY bucket
-    ORDER BY bucket
+    GROUP BY status_group
+    ORDER BY status_group
   colors:
     - "#48c78e"
     - "#209cee"
diff --git a/scripts/generate_reports.py b/scripts/generate_reports.py
index b9100f4..0a95bdc 100644
--- a/scripts/generate_reports.py
+++ b/scripts/generate_reports.py
@@ -169,6 +169,10 @@ def _generate_interval(interval: str, domain: Optional[str] = None) -> None:
         }
         if "icon" in definition:
             entry["icon"] = definition["icon"]
+        if "bucket" in definition:
+            entry["bucket"] = definition["bucket"]
+        if "bucket_label" in definition:
+            entry["bucket_label"] = definition["bucket_label"]
         if "color" in definition:
             entry["color"] = definition["color"]
         if "colors" in definition:
@@ -253,6 +257,10 @@ def _generate_global() -> None:
         }
         if "icon" in definition:
             entry["icon"] = definition["icon"]
+        if "bucket" in definition:
+            entry["bucket"] = definition["bucket"]
+        if "bucket_label" in definition:
+            entry["bucket_label"] = definition["bucket_label"]
         if "color" in definition:
             entry["color"] = definition["color"]
         if "colors" in definition:
diff --git a/templates/index.html b/templates/index.html
index 237f563..4db9e53 100644
--- a/templates/index.html
+++ b/templates/index.html
@@ -105,19 +105,20 @@
       fetch(base + '/' + rep.json)
         .then(r => r.json())
         .then(data => {
+          const bucketField = rep.bucket || 'bucket';
           if (rep.chart === 'table') {
-            const rows = data.map(x => [x.bucket, x.value]);
+            const rows = data.map(x => [x[bucketField], x.value]);
             new DataTable('#table-' + rep.name, {
               data: rows,
               columns: [
-                { title: 'Bucket' },
+                { title: rep.bucket_label || 'Bucket' },
                 { title: 'Value' }
               ]
             });
             return;
           }
 
-          const labels = data.map(x => x.bucket);
+          const labels = data.map(x => x[bucketField]);
           const values = data.map(x => x.value);
           const chartType = rep.chart === 'stackedBar' ? 'bar' : rep.chart;
           const options = { scales: { y: { beginAtZero: true } } };

From 832a0a49dde1611dad0f39f8cb6221249dc9823b Mon Sep 17 00:00:00 2001
From: Jordan Wages <jordan@jordanwages.com>
Date: Sat, 19 Jul 2025 04:31:13 -0500
Subject: [PATCH 03/26] docs: refresh README and agent guide

---
 AGENTS.md |  12 +++++
 README.md | 141 ++++++++++++++++++++++--------------------------------
 2 files changed, 70 insertions(+), 83 deletions(-)

diff --git a/AGENTS.md b/AGENTS.md
index 4cdfa62..7e7d3c5 100644
--- a/AGENTS.md
+++ b/AGENTS.md
@@ -24,6 +24,9 @@ This document outlines general practices and expectations for AI agents assistin
   The `run-import.sh` script can initialize this environment automatically.
   Always activate the virtual environment before running scripts or tests.
 
+* Before committing code, run `black` for consistent formatting and execute
+  the test suite with `pytest`. All tests should pass.
+
 * Dependency management: Use `requirements.txt` or `pip-tools`
 * Use standard libraries where feasible (e.g., `sqlite3`, `argparse`, `datetime`)
 * Adopt `typer` for CLI command interface (if CLI ergonomics matter)
@@ -89,6 +92,14 @@ ngxstat/
 
 If uncertain, the agent should prompt the human for clarification before making architectural assumptions.
 
+## Testing
+
+Use `pytest` for automated tests. Run the suite from an activated virtual environment and ensure all tests pass before committing:
+
+```bash
+pytest -q
+```
+
 ---
 
 ## Future Capabilities
@@ -106,3 +117,4 @@ As the project matures, agents may also:
 
 * **2025-07-17**: Initial version by Jordan + ChatGPT
 * **2025-07-17**: Expanded virtual environment usage guidance
+
diff --git a/README.md b/README.md
index acb1055..f641d96 100644
--- a/README.md
+++ b/README.md
@@ -1,11 +1,16 @@
 # ngxstat
-Per-domain Nginx log analytics with hybrid static reports and live insights.
 
-## Generating Reports
+`ngxstat` is a lightweight log analytics toolkit for Nginx. It imports access
+logs into an SQLite database and renders static dashboards so you can explore
+per-domain metrics without running a heavy backend service.
 
-Use the `generate_reports.py` script to build aggregated JSON and HTML snippet files from `database/ngxstat.db`.
+## Requirements
 
-Create a virtual environment and install dependencies:
+* Python 3.10+
+* Access to the Nginx log files (default: `/var/log/nginx`)
+
+The helper scripts create a virtual environment on first run, but you can also
+set one up manually:
 
 ```bash
 python3 -m venv .venv
@@ -13,118 +18,88 @@ source .venv/bin/activate
 pip install -r requirements.txt
 ```
 
-Then run one or more of the interval commands:
-
-```bash
-python scripts/generate_reports.py hourly
-python scripts/generate_reports.py daily
-python scripts/generate_reports.py weekly
-python scripts/generate_reports.py monthly
-```
-
-Each command accepts optional flags to generate per-domain reports. Use
-`--domain <name>` to limit output to a specific domain or `--all-domains`
-to generate a subdirectory for every domain found in the database:
-
-```bash
-# Hourly reports for example.com only
-python scripts/generate_reports.py hourly --domain example.com
-
-# Weekly reports for all domains individually
-python scripts/generate_reports.py weekly --all-domains
-```
-
-Reports are written under the `output/` directory. Each command updates the corresponding `<interval>.json` file and writes one HTML snippet per report. These snippets are loaded dynamically by the main dashboard using Chart.js and DataTables.
-
-### Configuring Reports
-
-Report queries are defined in `reports.yml`. Each entry specifies the `name`,
-optional `label` and `chart` type, and a SQL `query` that must return `bucket`
-and `value` columns. The special token `{bucket}` is replaced with the
-appropriate SQLite `strftime` expression for each interval (hourly, daily,
-weekly or monthly) so that a single definition works across all durations.
-When `generate_reports.py` runs, every definition is executed for the requested
-interval and creates `output/<interval>/<name>.json` plus a small HTML snippet
-`output/<interval>/<name>.html` used by the dashboard.
-
-Example snippet:
-
-```yaml
-- name: hits
-  chart: bar
-  query: |
-    SELECT {bucket} AS bucket,
-           COUNT(*) AS value
-    FROM logs
-    GROUP BY bucket
-    ORDER BY bucket
-```
-
-Add or modify entries in `reports.yml` to tailor the generated metrics.
-
 ## Importing Logs
 
-Use the `run-import.sh` script to set up the Python environment if needed and import the latest Nginx log entries into `database/ngxstat.db`.
+Run the importer to ingest new log entries into `database/ngxstat.db`:
 
 ```bash
 ./run-import.sh
 ```
 
-This script is suitable for cron jobs as it creates the virtual environment on first run, installs dependencies and reuses the environment on subsequent runs.
+Rotated logs are processed in order and only entries newer than the last
+imported timestamp are added.
 
-The importer handles rotated logs in order from oldest to newest so entries are
-processed exactly once. If you rerun the script, it only ingests records with a
-timestamp newer than the latest one already stored in the database, preventing
-duplicates.
+## Generating Reports
 
-## Cron Report Generation
-
-Use the `run-reports.sh` script to run all report intervals in one step. The script sets up the Python environment the same way as `run-import.sh`, making it convenient for automation via cron.
+To build the HTML dashboard and JSON data files, use `run-reports.sh`, which runs
+all intervals in one go:
 
 ```bash
 ./run-reports.sh
 ```
 
-Running this script will create or update the hourly, daily, weekly and monthly reports under `output/`. It also detects all unique domains found in the database and writes per-domain reports to `output/domains/<domain>/<interval>` alongside the aggregate data. After generation, open `output/index.html` in your browser to browse the reports.
+The script calls `scripts/generate_reports.py` internally to create hourly,
+daily, weekly and monthly reports. Per-domain reports are written under
+`output/domains/<domain>` alongside the aggregate data. Open
+`output/index.html` in a browser to view the dashboard.
 
+If you prefer to run individual commands, you can invoke the generator directly:
 
-## Log Analysis
+```bash
+python scripts/generate_reports.py hourly
+python scripts/generate_reports.py daily --all-domains
+```
 
-The `run-analysis.sh` script runs helper routines that inspect the database. It
-creates or reuses the virtual environment and then executes a set of analysis
-commands to spot missing domains, suggest cache rules and detect potential
-threats.
+## Analysis Helpers
+
+`run-analysis.sh` executes additional utilities that examine the database for
+missing domains, caching opportunities and potential threats. The JSON output is
+saved under `output/analysis` and appears in the "Analysis" tab of the
+dashboard.
 
 ```bash
 ./run-analysis.sh
 ```
-The JSON results are written under `output/analysis` and can be viewed from the
-"Analysis" tab in the generated dashboard.
-## Serving Reports with Nginx
 
-To expose the generated HTML dashboards and JSON files over HTTP you can use a
-simple Nginx server block. Point the `root` directive to the repository's
-`output/` directory and optionally restrict access to your local network.
+## Serving the Reports
+
+The generated files are static. You can serve them with a simple Nginx block:
 
 ```nginx
 server {
     listen 80;
     server_name example.com;
-
-    # Path to the generated reports
     root /path/to/ngxstat/output;
 
     location / {
         try_files $uri $uri/ =404;
     }
-
-    # Allow access only from private networks
-    allow 192.0.0.0/8;
-    allow 10.0.0.0/8;
-    deny  all;
 }
 ```
 
-With this configuration the generated static files are served directly by
-Nginx while connections outside of `192.*` and `10.*` are denied.
+Restrict access if the reports should not be public.
 
+## Running Tests
+
+Install the development dependencies and execute the suite with `pytest`:
+
+```bash
+pip install -r requirements.txt
+pytest -q
+```
+
+All tests must pass before submitting changes.
+
+## Acknowledgements
+
+ngxstat uses the following third-party resources:
+
+* [Chart.js](https://www.chartjs.org/) for charts
+* [DataTables](https://datatables.net/) and [jQuery](https://jquery.com/) for table views
+* [Bulma CSS](https://bulma.io/) for styling
+* Icons from [Free CC0 Icons](https://cc0-icons.jonh.eu/) by Jon Hicks (CC0 / MIT)
+* [Typer](https://typer.tiangolo.com/) for the command-line interface
+* [Jinja2](https://palletsprojects.com/p/jinja/) for templating
+
+The project is licensed under the GPLv3. Icon assets remain in the public domain
+via the CC0 license.

From 669b51e03cdea7575ae5c6ee754781b7274c1610 Mon Sep 17 00:00:00 2001
From: Jordan Wages <jordan@jordanwages.com>
Date: Sat, 19 Jul 2025 04:50:09 -0500
Subject: [PATCH 04/26] Add report generation timing stats

---
 scripts/generate_reports.py | 23 +++++++++++++++--------
 templates/index.html        |  7 +++++++
 tests/test_reports.py       | 20 +++++++++++---------
 3 files changed, 33 insertions(+), 17 deletions(-)

diff --git a/scripts/generate_reports.py b/scripts/generate_reports.py
index 0a95bdc..664a3a5 100644
--- a/scripts/generate_reports.py
+++ b/scripts/generate_reports.py
@@ -3,6 +3,8 @@ import sqlite3
 from pathlib import Path
 import shutil
 from typing import List, Dict, Optional
+from datetime import datetime
+import time
 
 import yaml
 
@@ -74,7 +76,9 @@ def _render_snippet(report: Dict, out_dir: Path) -> None:
     snippet_path.write_text(template.render(report=report))
 
 
-def _write_stats() -> None:
+def _write_stats(
+    generated_at: Optional[str] = None, generation_seconds: Optional[float] = None
+) -> None:
     """Query basic dataset stats and write them to ``output/global/stats.json``."""
     conn = sqlite3.connect(DB_PATH)
     cur = conn.cursor()
@@ -98,6 +102,10 @@ def _write_stats() -> None:
         "end_date": end_date,
         "unique_domains": unique_domains,
     }
+    if generated_at:
+        stats["generated_at"] = generated_at
+    if generation_seconds is not None:
+        stats["generation_seconds"] = generation_seconds
 
     out_path = OUTPUT_DIR / "global" / "stats.json"
     _save_json(out_path, stats)
@@ -197,14 +205,9 @@ def _generate_root_index() -> None:
     """Render the top-level index listing all intervals and domains."""
     _copy_icons()
     intervals = sorted(
-        [
-            name
-            for name in INTERVAL_FORMATS
-            if (OUTPUT_DIR / name).is_dir()
-        ]
+        [name for name in INTERVAL_FORMATS if (OUTPUT_DIR / name).is_dir()]
     )
 
-
     domains_dir = OUTPUT_DIR / "domains"
     domains: List[str] = []
     if domains_dir.is_dir():
@@ -227,6 +230,9 @@ def _generate_global() -> None:
         typer.echo("No report definitions found")
         return
 
+    start_time = time.time()
+    generated_at = datetime.utcnow().strftime("%Y-%m-%d %H:%M:%S")
+
     _copy_icons()
 
     conn = sqlite3.connect(DB_PATH)
@@ -269,7 +275,8 @@ def _generate_global() -> None:
         report_list.append(entry)
 
     _save_json(out_dir / "reports.json", report_list)
-    _write_stats()
+    elapsed = round(time.time() - start_time, 2)
+    _write_stats(generated_at, elapsed)
     typer.echo("Generated global reports")
 
 
diff --git a/templates/index.html b/templates/index.html
index 4db9e53..472ef25 100644
--- a/templates/index.html
+++ b/templates/index.html
@@ -49,6 +49,8 @@
         <p>Total logs: <span id="stat-total">-</span></p>
         <p>Date range: <span id="stat-start">-</span> to <span id="stat-end">-</span></p>
         <p>Unique domains: <span id="stat-domains">-</span></p>
+        <p>Last generated: <span id="stat-generated">-</span></p>
+        <p>Generation time: <span id="stat-elapsed">-</span> seconds</p>
       </div>
       <div id="overview-reports"></div>
     </div>
@@ -96,6 +98,8 @@
     const startElem = document.getElementById('stat-start');
     const endElem = document.getElementById('stat-end');
     const domainsElem = document.getElementById('stat-domains');
+    const generatedElem = document.getElementById('stat-generated');
+    const elapsedElem = document.getElementById('stat-elapsed');
 
     let currentInterval = intervalSelect.value;
     let currentDomain = domainSelect.value;
@@ -161,6 +165,9 @@
           startElem.textContent = stats.start_date;
           endElem.textContent = stats.end_date;
           domainsElem.textContent = stats.unique_domains;
+          generatedElem.textContent = stats.generated_at || '-';
+          elapsedElem.textContent =
+            stats.generation_seconds !== undefined ? stats.generation_seconds : '-';
         });
     }
 
diff --git a/tests/test_reports.py b/tests/test_reports.py
index dbe71c2..75d7737 100644
--- a/tests/test_reports.py
+++ b/tests/test_reports.py
@@ -148,20 +148,19 @@ def test_generate_interval_domain_filter(tmp_path, sample_reports, monkeypatch):
     gr._generate_interval("hourly", "example.com")
 
     hits = json.loads(
-        (tmp_path / "output" / "domains" / "example.com" / "hourly" / "hits.json").read_text()
+        (
+            tmp_path / "output" / "domains" / "example.com" / "hourly" / "hits.json"
+        ).read_text()
     )
     assert hits[0]["value"] == 2
     reports = json.loads(
-        (tmp_path / "output" / "domains" / "example.com" / "hourly" / "reports.json").read_text()
+        (
+            tmp_path / "output" / "domains" / "example.com" / "hourly" / "reports.json"
+        ).read_text()
     )
     assert {r["name"] for r in reports} == {"hits", "error_rate"}
     assert not (
-        tmp_path
-        / "output"
-        / "domains"
-        / "example.com"
-        / "hourly"
-        / "skip_report.json"
+        tmp_path / "output" / "domains" / "example.com" / "hourly" / "skip_report.json"
     ).exists()
 
 
@@ -245,9 +244,12 @@ def test_global_stats_file(tmp_path, sample_reports, monkeypatch):
         "start_date",
         "end_date",
         "unique_domains",
+        "generated_at",
+        "generation_seconds",
     }
     assert stats["total_logs"] == 2
     assert stats["start_date"] == "2024-01-01 10:00:00"
     assert stats["end_date"] == "2024-01-01 10:05:00"
     assert stats["unique_domains"] == 1
-
+    assert isinstance(stats["generated_at"], str)
+    assert stats["generation_seconds"] >= 0

From fb753a1189dbaab3b2d35a63f1b81668933f01ee Mon Sep 17 00:00:00 2001
From: Jordan Wages <jordan@jordanwages.com>
Date: Sat, 19 Jul 2025 16:41:58 -0500
Subject: [PATCH 05/26] fix: destroy charts when reloading domain reports

---
 templates/index.html | 11 +++++++++++
 1 file changed, 11 insertions(+)

diff --git a/templates/index.html b/templates/index.html
index 472ef25..b1cbf89 100644
--- a/templates/index.html
+++ b/templates/index.html
@@ -171,6 +171,15 @@
         });
     }
 
+    function destroyCharts(container) {
+      container.querySelectorAll('canvas').forEach(c => {
+        const chart = Chart.getChart(c);
+        if (chart) {
+          chart.destroy();
+        }
+      });
+    }
+
     function loadReports() {
       let path;
       let container;
@@ -183,6 +192,7 @@
       } else {
         container = containers.domain;
         if (!currentDomain) {
+          destroyCharts(container);
           container.innerHTML = '<p>Select a domain</p>';
           return;
         }
@@ -192,6 +202,7 @@
         fetch(path + '/reports.json')
           .then(r => r.json())
           .then(reports => {
+            destroyCharts(container);
             container.innerHTML = '';
             reports.forEach(rep => {
               fetch(path + '/' + rep.html)

From 297c913f2a314a843f0304baaa8cd2a7bf1ad8e5 Mon Sep 17 00:00:00 2001
From: Jordan Wages <jordan@jordanwages.com>
Date: Sat, 19 Jul 2025 17:03:48 -0500
Subject: [PATCH 06/26] fix: destroy charts when switching tabs

---
 scripts/analyze.py         | 22 +++++++++++-----------
 scripts/init_db.py         |  4 +++-
 scripts/nginx_config.py    |  1 -
 templates/index.html       |  5 +++++
 tests/test_importer.py     |  5 ++---
 tests/test_nginx_config.py |  1 -
 tests/test_run_analysis.py |  2 +-
 7 files changed, 22 insertions(+), 18 deletions(-)

diff --git a/scripts/analyze.py b/scripts/analyze.py
index 8ac7c30..fe7b818 100644
--- a/scripts/analyze.py
+++ b/scripts/analyze.py
@@ -105,7 +105,9 @@ def hits(domain: Optional[str] = typer.Option(None, help="Filter by domain")) ->
 
 
 @app.command("cache-ratio")
-def cache_ratio_cmd(domain: Optional[str] = typer.Option(None, help="Filter by domain")) -> None:
+def cache_ratio_cmd(
+    domain: Optional[str] = typer.Option(None, help="Filter by domain")
+) -> None:
     """Display cache hit ratio as a percentage."""
     ratio = get_cache_ratio(domain) * 100
     if domain:
@@ -115,7 +117,11 @@ def cache_ratio_cmd(domain: Optional[str] = typer.Option(None, help="Filter by d
 
 
 @app.command("check-missing-domains")
-def check_missing_domains(json_output: bool = typer.Option(False, "--json", help="Output missing domains as JSON")) -> None:
+def check_missing_domains(
+    json_output: bool = typer.Option(
+        False, "--json", help="Output missing domains as JSON"
+    )
+) -> None:
     """Show domains present in the database but absent from Nginx config."""
     try:
         from scripts.generate_reports import _get_domains as _db_domains
@@ -151,9 +157,7 @@ def check_missing_domains(json_output: bool = typer.Option(False, "--json", help
 
 @app.command("suggest-cache")
 def suggest_cache(
-    threshold: int = typer.Option(
-        10, help="Minimum number of MISS entries to report"
-    ),
+    threshold: int = typer.Option(10, help="Minimum number of MISS entries to report"),
     json_output: bool = typer.Option(False, "--json", help="Output results as JSON"),
 ) -> None:
     """Suggest domain/path pairs that could benefit from caching.
@@ -211,9 +215,7 @@ def suggest_cache(
 @app.command("detect-threats")
 def detect_threats(
     hours: int = typer.Option(1, help="Number of recent hours to analyze"),
-    ip_threshold: int = typer.Option(
-        100, help="Requests from a single IP to flag"
-    ),
+    ip_threshold: int = typer.Option(100, help="Requests from a single IP to flag"),
 ) -> None:
     """Detect potential security threats from recent logs."""
 
@@ -316,9 +318,7 @@ def detect_threats(
         """,
         (recent_start_s, recent_end_s, ip_threshold),
     )
-    high_ip_requests = [
-        {"ip": ip, "requests": cnt} for ip, cnt in cur.fetchall()
-    ]
+    high_ip_requests = [{"ip": ip, "requests": cnt} for ip, cnt in cur.fetchall()]
 
     conn.close()
 
diff --git a/scripts/init_db.py b/scripts/init_db.py
index f378b5c..b9ea07d 100644
--- a/scripts/init_db.py
+++ b/scripts/init_db.py
@@ -61,7 +61,9 @@ try:
             suffix = match.group(1)
             number = int(suffix.lstrip(".")) if suffix else 0
             log_files.append((number, os.path.join(LOG_DIR, f)))
-    log_files = [path for _, path in sorted(log_files, key=lambda x: x[0], reverse=True)]
+    log_files = [
+        path for _, path in sorted(log_files, key=lambda x: x[0], reverse=True)
+    ]
 except FileNotFoundError:
     print(f"[ERROR] Log directory not found: {LOG_DIR}")
     exit(1)
diff --git a/scripts/nginx_config.py b/scripts/nginx_config.py
index dbd635d..bc585a7 100644
--- a/scripts/nginx_config.py
+++ b/scripts/nginx_config.py
@@ -93,4 +93,3 @@ def parse_servers(paths: Set[Path]) -> List[Dict[str, str]]:
                 entry["root"] = " ".join(directives["root"])
             servers.append(entry)
     return servers
-
diff --git a/templates/index.html b/templates/index.html
index b1cbf89..84c6214 100644
--- a/templates/index.html
+++ b/templates/index.html
@@ -180,6 +180,10 @@
       });
     }
 
+    function destroyAllCharts() {
+      Object.values(containers).forEach(destroyCharts);
+    }
+
     function loadReports() {
       let path;
       let container;
@@ -296,6 +300,7 @@
     }
 
     function switchTab(name) {
+      destroyAllCharts();
       currentTab = name;
       tabs.forEach(tab => {
         tab.classList.toggle('is-active', tab.dataset.tab === name);
diff --git a/tests/test_importer.py b/tests/test_importer.py
index 349786b..38c9be9 100644
--- a/tests/test_importer.py
+++ b/tests/test_importer.py
@@ -15,10 +15,10 @@ def sample_logs(tmp_path):
     log_dir.mkdir(parents=True, exist_ok=True)
 
     (log_dir / "access.log.1").write_text(
-        "127.0.0.1 - example.com [01/Jan/2024:10:00:00 +0000] \"GET / HTTP/1.1\" 200 123 \"-\" \"curl\" MISS\n"
+        '127.0.0.1 - example.com [01/Jan/2024:10:00:00 +0000] "GET / HTTP/1.1" 200 123 "-" "curl" MISS\n'
     )
     (log_dir / "access.log").write_text(
-        "127.0.0.1 - example.com [01/Jan/2024:10:05:00 +0000] \"GET /about HTTP/1.1\" 200 123 \"-\" \"curl\" MISS\n"
+        '127.0.0.1 - example.com [01/Jan/2024:10:05:00 +0000] "GET /about HTTP/1.1" 200 123 "-" "curl" MISS\n'
     )
 
     yield log_dir
@@ -59,4 +59,3 @@ def test_idempotent_import(sample_logs, tmp_path):
 
     assert first_count == 2
     assert second_count == first_count
-
diff --git a/tests/test_nginx_config.py b/tests/test_nginx_config.py
index 782c635..a6494a7 100644
--- a/tests/test_nginx_config.py
+++ b/tests/test_nginx_config.py
@@ -67,4 +67,3 @@ server {
     assert servers[1]["server_name"] == "example.org"
     assert servers[1]["listen"] == "443 ssl"
     assert "proxy_cache" not in servers[1]
-
diff --git a/tests/test_run_analysis.py b/tests/test_run_analysis.py
index 66d00df..fad7953 100644
--- a/tests/test_run_analysis.py
+++ b/tests/test_run_analysis.py
@@ -14,7 +14,7 @@ def test_script_invokes_commands(tmp_path):
 
     calls = tmp_path / "calls.txt"
     python_stub = tmp_path / "python"
-    python_stub.write_text(f"#!/usr/bin/env bash\necho \"$*\" >> \"{calls}\"\n")
+    python_stub.write_text(f'#!/usr/bin/env bash\necho "$*" >> "{calls}"\n')
     python_stub.chmod(0o755)
     (tmp_path / "python3").write_text(f"#!/usr/bin/env bash\nexit 0\n")
     (tmp_path / "python3").chmod(0o755)

From 5d2546ad60d4676faf2d2c8944b75ba2fb51b104 Mon Sep 17 00:00:00 2001
From: Jordan Wages <jordan@jordanwages.com>
Date: Sat, 19 Jul 2025 18:01:26 -0500
Subject: [PATCH 07/26] Add chart loading management

---
 scripts/generate_reports.py | 15 ++++----
 static/chartManager.js      | 49 +++++++++++++++++++++++++
 templates/index.html        | 71 ++++++++++++++++++++-----------------
 3 files changed, 97 insertions(+), 38 deletions(-)
 create mode 100644 static/chartManager.js

diff --git a/scripts/generate_reports.py b/scripts/generate_reports.py
index 664a3a5..e587e6e 100644
--- a/scripts/generate_reports.py
+++ b/scripts/generate_reports.py
@@ -58,14 +58,17 @@ def _save_json(path: Path, data: List[Dict]) -> None:
 
 
 def _copy_icons() -> None:
-    """Copy vendored icons to the output directory."""
+    """Copy vendored icons and scripts to the output directory."""
     src_dir = Path("static/icons")
     dst_dir = OUTPUT_DIR / "icons"
-    if not src_dir.is_dir():
-        return
-    dst_dir.mkdir(parents=True, exist_ok=True)
-    for icon in src_dir.glob("*.svg"):
-        shutil.copy(icon, dst_dir / icon.name)
+    if src_dir.is_dir():
+        dst_dir.mkdir(parents=True, exist_ok=True)
+        for icon in src_dir.glob("*.svg"):
+            shutil.copy(icon, dst_dir / icon.name)
+
+    js_src = Path("static/chartManager.js")
+    if js_src.is_file():
+        shutil.copy(js_src, OUTPUT_DIR / js_src.name)
 
 
 def _render_snippet(report: Dict, out_dir: Path) -> None:
diff --git a/static/chartManager.js b/static/chartManager.js
new file mode 100644
index 0000000..79d83fc
--- /dev/null
+++ b/static/chartManager.js
@@ -0,0 +1,49 @@
+export let currentLoad = null;
+const loadInfo = new Map();
+
+export function newLoad(container) {
+  if (currentLoad) {
+    abortLoad(currentLoad);
+  }
+  reset(container);
+  const controller = new AbortController();
+  const token = { controller, charts: new Map() };
+  loadInfo.set(token, token);
+  currentLoad = token;
+  return token;
+}
+
+export function abortLoad(token) {
+  const info = loadInfo.get(token);
+  if (!info) return;
+  info.controller.abort();
+  info.charts.forEach(chart => {
+    try {
+      chart.destroy();
+    } catch (e) {}
+  });
+  loadInfo.delete(token);
+  if (currentLoad === token) {
+    currentLoad = null;
+  }
+}
+
+export function registerChart(token, id, chart) {
+  const info = loadInfo.get(token);
+  if (info) {
+    info.charts.set(id, chart);
+  } else {
+    chart.destroy();
+  }
+}
+
+export function reset(container) {
+  if (!container) return;
+  container.querySelectorAll('canvas').forEach(c => {
+    const chart = Chart.getChart(c);
+    if (chart) {
+      chart.destroy();
+    }
+  });
+  container.innerHTML = '';
+}
diff --git a/templates/index.html b/templates/index.html
index 84c6214..1b27003 100644
--- a/templates/index.html
+++ b/templates/index.html
@@ -72,7 +72,14 @@
   <script src="https://cdn.jsdelivr.net/npm/chart.js"></script>
   <script src="https://cdn.jsdelivr.net/npm/jquery@3.7.0/dist/jquery.min.js"></script>
   <script src="https://cdn.datatables.net/1.13.4/js/jquery.dataTables.min.js"></script>
-  <script>
+  <script type="module">
+    import {
+      newLoad,
+      abortLoad,
+      registerChart,
+      reset,
+      currentLoad,
+    } from './chartManager.js';
     const intervalSelect = document.getElementById('interval-select');
     const domainSelect = document.getElementById('domain-select');
     const intervalControl = document.getElementById('interval-control');
@@ -105,20 +112,22 @@
     let currentDomain = domainSelect.value;
     let currentTab = 'overview';
 
-    function initReport(rep, base) {
-      fetch(base + '/' + rep.json)
+    function initReport(token, rep, base) {
+      fetch(base + '/' + rep.json, { signal: token.controller.signal })
         .then(r => r.json())
         .then(data => {
+          if (token !== currentLoad) return;
           const bucketField = rep.bucket || 'bucket';
           if (rep.chart === 'table') {
             const rows = data.map(x => [x[bucketField], x.value]);
-            new DataTable('#table-' + rep.name, {
+            const table = new DataTable('#table-' + rep.name, {
               data: rows,
               columns: [
                 { title: rep.bucket_label || 'Bucket' },
                 { title: 'Value' }
               ]
             });
+            registerChart(token, rep.name, table);
             return;
           }
 
@@ -146,7 +155,7 @@
             dataset.backgroundColor = 'rgba(54, 162, 235, 0.5)';
             dataset.borderColor = 'rgba(54, 162, 235, 1)';
           }
-          new Chart(document.getElementById('chart-' + rep.name), {
+          const chart = new Chart(document.getElementById('chart-' + rep.name), {
             type: chartType,
             data: {
               labels: labels,
@@ -154,6 +163,7 @@
             },
             options: options
           });
+          registerChart(token, rep.name, chart);
         });
     }
 
@@ -171,18 +181,7 @@
         });
     }
 
-    function destroyCharts(container) {
-      container.querySelectorAll('canvas').forEach(c => {
-        const chart = Chart.getChart(c);
-        if (chart) {
-          chart.destroy();
-        }
-      });
-    }
-
-    function destroyAllCharts() {
-      Object.values(containers).forEach(destroyCharts);
-    }
+    // Reset helpers managed by chartManager
 
     function loadReports() {
       let path;
@@ -196,27 +195,29 @@
       } else {
         container = containers.domain;
         if (!currentDomain) {
-          destroyCharts(container);
+          reset(container);
           container.innerHTML = '<p>Select a domain</p>';
           return;
         }
         path = 'domains/' + encodeURIComponent(currentDomain) + '/' + currentInterval;
       }
 
-        fetch(path + '/reports.json')
-          .then(r => r.json())
-          .then(reports => {
-            destroyCharts(container);
-            container.innerHTML = '';
-            reports.forEach(rep => {
-              fetch(path + '/' + rep.html)
-                .then(r => r.text())
-                .then(html => {
-                  container.insertAdjacentHTML('beforeend', html);
-                  initReport(rep, path);
-                });
-            });
+      const token = newLoad(container);
+
+      fetch(path + '/reports.json', { signal: token.controller.signal })
+        .then(r => r.json())
+        .then(reports => {
+          if (token !== currentLoad) return;
+          reports.forEach(rep => {
+            fetch(path + '/' + rep.html, { signal: token.controller.signal })
+              .then(r => r.text())
+              .then(html => {
+                if (token !== currentLoad) return;
+                container.insertAdjacentHTML('beforeend', html);
+                initReport(token, rep, path);
+              });
           });
+        });
     }
 
     function loadAnalysis() {
@@ -300,7 +301,8 @@
     }
 
     function switchTab(name) {
-      destroyAllCharts();
+      abortLoad(currentLoad);
+      Object.values(containers).forEach(reset);
       currentTab = name;
       tabs.forEach(tab => {
         tab.classList.toggle('is-active', tab.dataset.tab === name);
@@ -322,11 +324,16 @@
 
     intervalSelect.addEventListener('change', () => {
       currentInterval = intervalSelect.value;
+      abortLoad(currentLoad);
+      reset(containers.all);
+      reset(containers.domain);
       loadReports();
     });
 
     domainSelect.addEventListener('change', () => {
       currentDomain = domainSelect.value;
+      abortLoad(currentLoad);
+      reset(containers.domain);
       loadReports();
     });
 

From 1d4e99c69bf83adc7c46e1494b8c33b118ad57a6 Mon Sep 17 00:00:00 2001
From: Jordan Wages <jordan@jordanwages.com>
Date: Sat, 19 Jul 2025 18:19:58 -0500
Subject: [PATCH 08/26] Add multi-bucket support for tables and update reports

---
 reports.yml                 | 81 +++++++++++++++++++++++++------------
 scripts/generate_reports.py |  4 ++
 templates/index.html        | 19 +++++----
 tests/test_reports.py       | 56 +++++++++++++++++++++++++
 4 files changed, 127 insertions(+), 33 deletions(-)

diff --git a/reports.yml b/reports.yml
index c9b9cd3..1ae8e6f 100644
--- a/reports.yml
+++ b/reports.yml
@@ -75,47 +75,78 @@
   label: Top Paths
   icon: map
   chart: table
-  bucket: path
-  bucket_label: Path
+  buckets:
+    - domain
+    - path
+  bucket_label:
+    - Domain
+    - Path
   query: |
-    SELECT path AS path,
-           COUNT(*) AS value
-    FROM (
-        SELECT substr(substr(request, instr(request, ' ') + 1), 1,
+    WITH paths AS (
+        SELECT host AS domain,
+               substr(substr(request, instr(request, ' ') + 1), 1,
                       instr(substr(request, instr(request, ' ') + 1), ' ') - 1) AS path
         FROM logs
+    ), ranked AS (
+        SELECT domain, path, COUNT(*) AS value,
+               ROW_NUMBER() OVER (PARTITION BY domain ORDER BY COUNT(*) DESC) AS rn
+        FROM paths
+        GROUP BY domain, path
     )
-    GROUP BY path
-    ORDER BY value DESC
-    LIMIT 20
+    SELECT domain, path, value
+    FROM ranked
+    WHERE rn <= 20
+    ORDER BY domain, value DESC
 
 - name: user_agents
   label: User Agents
   icon: user
   chart: table
-  bucket: user_agent
-  bucket_label: User Agent
+  buckets:
+    - domain
+    - user_agent
+  bucket_label:
+    - Domain
+    - User Agent
   query: |
-    SELECT user_agent AS user_agent,
-           COUNT(*) AS value
-    FROM logs
-    GROUP BY user_agent
-    ORDER BY value DESC
-    LIMIT 20
+    WITH ua AS (
+        SELECT host AS domain, user_agent
+        FROM logs
+    ), ranked AS (
+        SELECT domain, user_agent, COUNT(*) AS value,
+               ROW_NUMBER() OVER (PARTITION BY domain ORDER BY COUNT(*) DESC) AS rn
+        FROM ua
+        GROUP BY domain, user_agent
+    )
+    SELECT domain, user_agent, value
+    FROM ranked
+    WHERE rn <= 20
+    ORDER BY domain, value DESC
 
 - name: referrers
   label: Referrers
   icon: link
   chart: table
-  bucket: referrer
-  bucket_label: Referrer
+  buckets:
+    - domain
+    - referrer
+  bucket_label:
+    - Domain
+    - Referrer
   query: |
-    SELECT referer AS referrer,
-           COUNT(*) AS value
-    FROM logs
-    GROUP BY referrer
-    ORDER BY value DESC
-    LIMIT 20
+    WITH ref AS (
+        SELECT host AS domain, referer AS referrer
+        FROM logs
+    ), ranked AS (
+        SELECT domain, referrer, COUNT(*) AS value,
+               ROW_NUMBER() OVER (PARTITION BY domain ORDER BY COUNT(*) DESC) AS rn
+        FROM ref
+        GROUP BY domain, referrer
+    )
+    SELECT domain, referrer, value
+    FROM ranked
+    WHERE rn <= 20
+    ORDER BY domain, value DESC
 
 - name: status_distribution
   label: HTTP Statuses
diff --git a/scripts/generate_reports.py b/scripts/generate_reports.py
index e587e6e..265da2d 100644
--- a/scripts/generate_reports.py
+++ b/scripts/generate_reports.py
@@ -182,6 +182,8 @@ def _generate_interval(interval: str, domain: Optional[str] = None) -> None:
             entry["icon"] = definition["icon"]
         if "bucket" in definition:
             entry["bucket"] = definition["bucket"]
+        if "buckets" in definition:
+            entry["buckets"] = definition["buckets"]
         if "bucket_label" in definition:
             entry["bucket_label"] = definition["bucket_label"]
         if "color" in definition:
@@ -268,6 +270,8 @@ def _generate_global() -> None:
             entry["icon"] = definition["icon"]
         if "bucket" in definition:
             entry["bucket"] = definition["bucket"]
+        if "buckets" in definition:
+            entry["buckets"] = definition["buckets"]
         if "bucket_label" in definition:
             entry["bucket_label"] = definition["bucket_label"]
         if "color" in definition:
diff --git a/templates/index.html b/templates/index.html
index 1b27003..edb53f6 100644
--- a/templates/index.html
+++ b/templates/index.html
@@ -117,21 +117,24 @@
         .then(r => r.json())
         .then(data => {
           if (token !== currentLoad) return;
-          const bucketField = rep.bucket || 'bucket';
+          const bucketFields = rep.buckets || [rep.bucket || 'bucket'];
+          const labels = Array.isArray(rep.bucket_label)
+            ? rep.bucket_label
+            : [rep.bucket_label || 'Bucket'];
           if (rep.chart === 'table') {
-            const rows = data.map(x => [x[bucketField], x.value]);
+            const rows = data.map(x => bucketFields.map(f => x[f]).concat(x.value));
+            const columns = labels.map(l => ({ title: l }));
+            columns.push({ title: 'Value' });
             const table = new DataTable('#table-' + rep.name, {
               data: rows,
-              columns: [
-                { title: rep.bucket_label || 'Bucket' },
-                { title: 'Value' }
-              ]
+              columns: columns
             });
             registerChart(token, rep.name, table);
             return;
           }
 
-          const labels = data.map(x => x[bucketField]);
+          const bucketField = bucketFields[0];
+          const labelsArr = data.map(x => x[bucketField]);
           const values = data.map(x => x.value);
           const chartType = rep.chart === 'stackedBar' ? 'bar' : rep.chart;
           const options = { scales: { y: { beginAtZero: true } } };
@@ -158,7 +161,7 @@
           const chart = new Chart(document.getElementById('chart-' + rep.name), {
             type: chartType,
             data: {
-              labels: labels,
+              labels: labelsArr,
               datasets: [dataset]
             },
             options: options
diff --git a/tests/test_reports.py b/tests/test_reports.py
index 75d7737..f9399df 100644
--- a/tests/test_reports.py
+++ b/tests/test_reports.py
@@ -253,3 +253,59 @@ def test_global_stats_file(tmp_path, sample_reports, monkeypatch):
     assert stats["unique_domains"] == 1
     assert isinstance(stats["generated_at"], str)
     assert stats["generation_seconds"] >= 0
+
+
+def test_multi_bucket_table(tmp_path, monkeypatch):
+    db_path = tmp_path / "database" / "ngxstat.db"
+    setup_db(db_path)
+    # Insert one foo.com request (GET /foo, user agent "curl") after setup_db() ran.
+    conn = sqlite3.connect(db_path)
+    cur = conn.cursor()
+    cur.execute(
+        "INSERT INTO logs (ip, host, time, request, status, bytes_sent, referer, user_agent, cache_status) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?)",
+        (
+            "127.0.0.1",
+            "foo.com",
+            "2024-01-01 10:10:00",
+            "GET /foo HTTP/1.1",
+            200,
+            100,
+            "-",
+            "curl",
+            "MISS",
+        ),
+    )
+    conn.commit()
+    conn.close()
+    # Global table report with two bucket columns and a matching list of labels.
+    cfg = tmp_path / "reports.yml"
+    cfg.write_text(
+        """
+- name: multi
+  chart: table
+  global: true
+  buckets: [domain, agent]
+  bucket_label: [Domain, Agent]
+  query: |
+    SELECT host AS domain, user_agent AS agent, COUNT(*) AS value
+    FROM logs
+    GROUP BY host, agent
+"""
+    )
+    # Redirect the generator's module-level paths to the temporary tree.
+    monkeypatch.setattr(gr, "DB_PATH", db_path)
+    monkeypatch.setattr(gr, "OUTPUT_DIR", tmp_path / "output")
+    monkeypatch.setattr(gr, "REPORT_CONFIG", cfg)
+    monkeypatch.setattr(
+        gr, "TEMPLATE_DIR", Path(__file__).resolve().parents[1] / "templates"
+    )
+    # Generate the global reports, then the hourly interval.
+    gr._generate_global()
+    gr._generate_interval("hourly")
+    # multi.json rows and its reports.json entry must carry the multi-bucket fields.
+    data = json.loads((tmp_path / "output" / "global" / "multi.json").read_text())
+    assert {"domain", "agent", "value"} <= data[0].keys()
+    reports = json.loads((tmp_path / "output" / "global" / "reports.json").read_text())
+    entry = next(r for r in reports if r["name"] == "multi")
+    assert entry["buckets"] == ["domain", "agent"]
+    assert entry["bucket_label"] == ["Domain", "Agent"]

From 2300849fdcce104e868b76f69ca63ac65c5d4a03 Mon Sep 17 00:00:00 2001
From: Jordan Wages <jordan@jordanwages.com>
Date: Sat, 2 Aug 2025 03:12:59 -0500
Subject: [PATCH 09/26] Place generated marker in output directory

---
 scripts/generate_reports.py | 13 +++++++++++++
 tests/test_reports.py       | 22 +++++++++++++++++++---
 2 files changed, 32 insertions(+), 3 deletions(-)

diff --git a/scripts/generate_reports.py b/scripts/generate_reports.py
index 265da2d..a45e4eb 100644
--- a/scripts/generate_reports.py
+++ b/scripts/generate_reports.py
@@ -15,6 +15,7 @@ DB_PATH = Path("database/ngxstat.db")
 OUTPUT_DIR = Path("output")
 TEMPLATE_DIR = Path("templates")
 REPORT_CONFIG = Path("reports.yml")
+GENERATED_MARKER = OUTPUT_DIR / "generated.txt"
 
 # Mapping of interval names to SQLite strftime formats.  These strings are
 # substituted into report queries whenever the special ``{bucket}`` token is
@@ -30,6 +31,27 @@ INTERVAL_FORMATS = {
 app = typer.Typer(help="Generate aggregated log reports")
 
 
+@app.callback()
+def _cli_callback(ctx: typer.Context) -> None:
+    """Register a hook that records the generation time once the CLI closes.
+
+    The hook is attached with ``ctx.call_on_close`` and writes a UTC timestamp
+    (``YYYY-MM-DD HH:MM:SS``) to ``GENERATED_MARKER``, creating ``OUTPUT_DIR``
+    first if needed.
+    """
+
+    def _write_marker() -> None:
+        # Local import: ``datetime.utcnow()`` is deprecated since Python 3.12,
+        # so take an aware UTC "now"; the formatted text is unchanged.
+        from datetime import timezone
+
+        OUTPUT_DIR.mkdir(parents=True, exist_ok=True)
+        timestamp = datetime.now(timezone.utc).strftime("%Y-%m-%d %H:%M:%S")
+        GENERATED_MARKER.write_text(f"{timestamp}\n")
+
+    ctx.call_on_close(_write_marker)
+
+
 def _get_domains() -> List[str]:
     """Return a sorted list of unique domains from the logs table."""
     conn = sqlite3.connect(DB_PATH)
diff --git a/tests/test_reports.py b/tests/test_reports.py
index f9399df..fa8f0a0 100644
--- a/tests/test_reports.py
+++ b/tests/test_reports.py
@@ -2,8 +2,10 @@ import sqlite3
 from pathlib import Path
 import json
 import sys
+from datetime import datetime
 
 import pytest
+from typer.testing import CliRunner
 
 REPO_ROOT = Path(__file__).resolve().parents[1]
 sys.path.append(str(REPO_ROOT))
@@ -199,9 +201,23 @@ def test_generate_root_index(tmp_path, sample_reports, monkeypatch):
     assert '<option value="Global">' not in content
     assert '<option value="analysis">' not in content
 
-    # check for domain options
-    assert '<option value="foo.com">' in content
-    assert '<option value="bar.com">' in content
+
+def test_generated_marker_written(tmp_path, monkeypatch):
+    out_dir = tmp_path / "output"
+    monkeypatch.setattr(gr, "OUTPUT_DIR", out_dir)
+    monkeypatch.setattr(gr, "TEMPLATE_DIR", REPO_ROOT / "templates")
+    monkeypatch.setattr(gr, "GENERATED_MARKER", out_dir / "generated.txt")
+    monkeypatch.setattr(gr, "_copy_icons", lambda: None)
+    (out_dir / "hourly").mkdir(parents=True)
+
+    runner = CliRunner()
+    result = runner.invoke(gr.app, ["index"])
+    assert result.exit_code == 0, result.output
+
+    marker = out_dir / "generated.txt"
+    assert marker.exists()
+    content = marker.read_text().strip()
+    datetime.strptime(content, "%Y-%m-%d %H:%M:%S")
 
 
 def test_global_reports_once(tmp_path, sample_reports, monkeypatch):

From 91f87689d07039ef73527f22727c3abcf568e408 Mon Sep 17 00:00:00 2001
From: ngxstat-bot <bot@localhost>
Date: Sat, 16 Aug 2025 04:57:20 -0500
Subject: [PATCH 10/26] ci: add Forgejo Actions workflow for lint, test, and
 sample reports artifact

---
 .forgejo/workflows/ci.yml | 92 +++++++++++++++++++++++++++++++++++++++
 1 file changed, 92 insertions(+)
 create mode 100644 .forgejo/workflows/ci.yml

diff --git a/.forgejo/workflows/ci.yml b/.forgejo/workflows/ci.yml
new file mode 100644
index 0000000..65439eb
--- /dev/null
+++ b/.forgejo/workflows/ci.yml
@@ -0,0 +1,92 @@
+name: CI
+
+on:
+  push:
+  pull_request:
+  workflow_dispatch:
+
+jobs:
+  lint-and-test:
+    name: Lint and test (py${{ matrix.python }})
+    # Adjust this label to match your Forgejo runner
+    runs-on: docker
+    container:
+      image: python:${{ matrix.python }}-bookworm
+    strategy:
+      fail-fast: false
+      matrix:
+        python: ["3.10", "3.11", "3.12"]
+    steps:
+      - name: Checkout
+        uses: actions/checkout@v4
+
+      - name: Set up Python (inside container)
+        run: |
+          python -m pip install --upgrade pip
+          pip --version
+
+      - name: Install dependencies
+        run: |
+          pip install -r requirements.txt
+          pip install pytest
+
+      - name: Format check (black)
+        run: black --check .
+
+      - name: Lint (flake8)
+        run: flake8 .
+
+      - name: Run tests (pytest)
+        env:
+          PYTHONDONTWRITEBYTECODE: "1"
+        run: pytest -q
+
+  build-reports:
+    name: Build sample reports artifact
+    needs: lint-and-test
+    runs-on: docker
+    container:
+      image: python:3.11-bookworm
+    steps:
+      - name: Checkout
+        uses: actions/checkout@v4
+
+      - name: Install dependencies
+        run: |
+          python -m pip install --upgrade pip
+          pip install -r requirements.txt
+
+      - name: Seed minimal DB and generate reports
+        run: |
+          python - <<'PY'
+          import sqlite3, pathlib
+          db = pathlib.Path('database/ngxstat.db')
+          db.parent.mkdir(parents=True, exist_ok=True)
+          conn = sqlite3.connect(db)
+          cur = conn.cursor()
+          cur.execute('''CREATE TABLE IF NOT EXISTS logs (
+              id INTEGER PRIMARY KEY,
+              ip TEXT,
+              host TEXT,
+              time TEXT,
+              request TEXT,
+              status INTEGER,
+              bytes_sent INTEGER,
+              referer TEXT,
+              user_agent TEXT,
+              cache_status TEXT
+          )''')
+          cur.execute("INSERT INTO logs (ip, host, time, request, status, bytes_sent, referer, user_agent, cache_status) VALUES ('127.0.0.1','example.com','2024-01-01 10:00:00','GET / HTTP/1.1',200,100,'-','curl','MISS')")
+          cur.execute("INSERT INTO logs (ip, host, time, request, status, bytes_sent, referer, user_agent, cache_status) VALUES ('127.0.0.1','example.com','2024-01-01 10:05:00','GET /about HTTP/1.1',200,100,'-','curl','MISS')")
+          conn.commit(); conn.close()
+          PY
+          python scripts/generate_reports.py global
+          python scripts/generate_reports.py hourly
+          python scripts/generate_reports.py index
+
+      - name: Upload reports artifact
+        uses: actions/upload-artifact@v4
+        with:
+          name: ngxstat-reports
+          path: output/
+

From 0363c372027d1df49ef9fd20ea642f4e065a989d Mon Sep 17 00:00:00 2001
From: ngxstat-bot <bot@localhost>
Date: Sat, 16 Aug 2025 05:05:33 -0500
Subject: [PATCH 11/26] ci: replace Node-based actions with manual git clone
 and Debian container

---
 .forgejo/workflows/ci.yml | 115 +++++++++++++++++++++++---------------
 1 file changed, 71 insertions(+), 44 deletions(-)

diff --git a/.forgejo/workflows/ci.yml b/.forgejo/workflows/ci.yml
index 65439eb..a5f4930 100644
--- a/.forgejo/workflows/ci.yml
+++ b/.forgejo/workflows/ci.yml
@@ -6,58 +6,90 @@ on:
   workflow_dispatch:
 
 jobs:
-  lint-and-test:
-    name: Lint and test (py${{ matrix.python }})
-    # Adjust this label to match your Forgejo runner
+  ci:
+    name: Lint, test, and build
+    # This label must match your Forgejo runner's label
     runs-on: docker
-    container:
-      image: python:${{ matrix.python }}-bookworm
-    strategy:
-      fail-fast: false
-      matrix:
-        python: ["3.10", "3.11", "3.12"]
+    # Use a clean Debian container so tools are predictable
+    container: debian:stable-slim
+    env:
+      PYTHONDONTWRITEBYTECODE: "1"
+      PIP_DISABLE_PIP_VERSION_CHECK: "1"
+      UV_SYSTEM_PYTHON: "1"
     steps:
-      - name: Checkout
-        uses: actions/checkout@v4
-
-      - name: Set up Python (inside container)
+      - name: Install build tooling
         run: |
+          set -euo pipefail
+          apt-get update
+          DEBIAN_FRONTEND=noninteractive apt-get install -y --no-install-recommends \
+            git ca-certificates python3 python3-venv python3-pip python3-setuptools \
+            python3-wheel sqlite3
+          update-ca-certificates || true
+
+      - name: Checkout repository (manual)
+        run: |
+          set -euo pipefail
+          if [ -f Makefile ] || [ -d .git ]; then
+            echo "Repository present in workspace; skipping clone"
+            exit 0
+          fi
+          REMOTE_URL="${CI_REPOSITORY_URL:-}"
+          if [ -z "$REMOTE_URL" ]; then
+            if [ -n "${GITHUB_SERVER_URL:-}" ] && [ -n "${GITHUB_REPOSITORY:-}" ]; then
+              REMOTE_URL="${GITHUB_SERVER_URL%/}/${GITHUB_REPOSITORY}.git"
+            elif [ -n "${GITHUB_REPOSITORY:-}" ]; then
+              REMOTE_URL="https://git.jordanwages.com/${GITHUB_REPOSITORY}.git"
+            else
+              echo "Unable to determine repository URL from CI environment" >&2
+              exit 1
+            fi
+          fi
+          AUTH_URL="$REMOTE_URL"
+          if [ -n "${GITHUB_TOKEN:-}" ]; then
+            ACTOR="${GITHUB_ACTOR:-oauth2}"
+            AUTH_URL=$(printf '%s' "$REMOTE_URL" | sed -E "s#^https://#https://${ACTOR}:${GITHUB_TOKEN}@#")
+          fi
+          echo "Cloning from: $REMOTE_URL"
+          if ! git clone --depth 1 "$AUTH_URL" .; then
+            echo "Auth clone failed; trying anonymous clone..." >&2
+            git clone --depth 1 "$REMOTE_URL" .
+          fi
+          if [ -n "${GITHUB_SHA:-}" ]; then
+            git fetch --depth 1 origin "$GITHUB_SHA" || true
+            git checkout -q "$GITHUB_SHA" || true
+          elif [ -n "${GITHUB_REF_NAME:-}" ]; then
+            git fetch --depth 1 origin "$GITHUB_REF_NAME" || true
+            git checkout -q "$GITHUB_REF_NAME" || true
+          fi
+
+      - name: Set up venv and install deps
+        run: |
+          set -euo pipefail
+          python3 -m venv .venv
+          . .venv/bin/activate
           python -m pip install --upgrade pip
-          pip --version
-
-      - name: Install dependencies
-        run: |
           pip install -r requirements.txt
           pip install pytest
 
       - name: Format check (black)
-        run: black --check .
+        run: |
+          . .venv/bin/activate
+          black --check .
 
       - name: Lint (flake8)
-        run: flake8 .
+        run: |
+          . .venv/bin/activate
+          flake8 .
 
       - name: Run tests (pytest)
-        env:
-          PYTHONDONTWRITEBYTECODE: "1"
-        run: pytest -q
-
-  build-reports:
-    name: Build sample reports artifact
-    needs: lint-and-test
-    runs-on: docker
-    container:
-      image: python:3.11-bookworm
-    steps:
-      - name: Checkout
-        uses: actions/checkout@v4
-
-      - name: Install dependencies
         run: |
-          python -m pip install --upgrade pip
-          pip install -r requirements.txt
+          . .venv/bin/activate
+          pytest -q
 
-      - name: Seed minimal DB and generate reports
+      - name: Build sample reports (no artifact upload)
         run: |
+          set -euo pipefail
+          . .venv/bin/activate
           python - <<'PY'
           import sqlite3, pathlib
           db = pathlib.Path('database/ngxstat.db')
@@ -83,10 +115,5 @@ jobs:
           python scripts/generate_reports.py global
           python scripts/generate_reports.py hourly
           python scripts/generate_reports.py index
-
-      - name: Upload reports artifact
-        uses: actions/upload-artifact@v4
-        with:
-          name: ngxstat-reports
-          path: output/
-
+          tar -czf ngxstat-reports.tar.gz -C output .
+          echo "Built sample reports archive: ngxstat-reports.tar.gz"

From 979fbb0e64348adbf4c0a13ba34172275cc6a1e2 Mon Sep 17 00:00:00 2001
From: ngxstat-bot <bot@localhost>
Date: Sat, 16 Aug 2025 05:14:01 -0500
Subject: [PATCH 12/26] ci(lint): configure flake8 excludes/line-length; fix
 F541 and F401 in tests

---
 .flake8                    | 6 ++++++
 tests/test_nginx_config.py | 2 +-
 tests/test_run_analysis.py | 2 +-
 3 files changed, 8 insertions(+), 2 deletions(-)
 create mode 100644 .flake8

diff --git a/.flake8 b/.flake8
new file mode 100644
index 0000000..0ba73e9
--- /dev/null
+++ b/.flake8
@@ -0,0 +1,6 @@
+[flake8]
+exclude = .git, .venv, output, static/icons
+max-line-length = 160
+per-file-ignores =
+    tests/test_*.py: E402
+
diff --git a/tests/test_nginx_config.py b/tests/test_nginx_config.py
index a6494a7..b2b1317 100644
--- a/tests/test_nginx_config.py
+++ b/tests/test_nginx_config.py
@@ -1,6 +1,6 @@
 import sys
 from pathlib import Path
-import pytest
+import pytest  # noqa: F401
 
 REPO_ROOT = Path(__file__).resolve().parents[1]
 sys.path.append(str(REPO_ROOT))
diff --git a/tests/test_run_analysis.py b/tests/test_run_analysis.py
index fad7953..7150895 100644
--- a/tests/test_run_analysis.py
+++ b/tests/test_run_analysis.py
@@ -16,7 +16,7 @@ def test_script_invokes_commands(tmp_path):
     python_stub = tmp_path / "python"
     python_stub.write_text(f'#!/usr/bin/env bash\necho "$*" >> "{calls}"\n')
     python_stub.chmod(0o755)
-    (tmp_path / "python3").write_text(f"#!/usr/bin/env bash\nexit 0\n")
+    (tmp_path / "python3").write_text("#!/usr/bin/env bash\nexit 0\n")
     (tmp_path / "python3").chmod(0o755)
 
     env = os.environ.copy()

From 136b4196ea66b9453d776b5fb2d3c03a7a7e0ae3 Mon Sep 17 00:00:00 2001
From: ngxstat-bot <bot@localhost>
Date: Sat, 16 Aug 2025 05:15:59 -0500
Subject: [PATCH 13/26] ci: add pytest --maxfail=1 and simple pip/venv cache at
 /cache if available

---
 .forgejo/workflows/ci.yml | 30 ++++++++++++++++++++++++++----
 1 file changed, 26 insertions(+), 4 deletions(-)

diff --git a/.forgejo/workflows/ci.yml b/.forgejo/workflows/ci.yml
index a5f4930..2717345 100644
--- a/.forgejo/workflows/ci.yml
+++ b/.forgejo/workflows/ci.yml
@@ -65,11 +65,33 @@ jobs:
       - name: Set up venv and install deps
         run: |
           set -euo pipefail
-          python3 -m venv .venv
+          # Prefer persistent cache if runner provides /cache
+          USE_CACHE=0
+          if [ -d /cache ] && [ -w /cache ]; then
+            export PIP_CACHE_DIR=/cache/pip
+            mkdir -p "$PIP_CACHE_DIR"
+            REQ_HASH=$(sha256sum requirements.txt | awk '{print $1}')
+            PYVER=$(python3 -c 'import sys;print(".".join(map(str, sys.version_info[:2])))')
+            CACHE_VENV="/cache/venv-${REQ_HASH}-py${PYVER}"
+            if [ -d "$CACHE_VENV" ]; then
+              echo "Using cached virtualenv: $CACHE_VENV"
+              ln -s "$CACHE_VENV" .venv
+              USE_CACHE=1
+            else
+              echo "Creating cached virtualenv: $CACHE_VENV"
+              python3 -m venv "$CACHE_VENV"
+              ln -s "$CACHE_VENV" .venv
+            fi
+          fi
+
           . .venv/bin/activate
           python -m pip install --upgrade pip
-          pip install -r requirements.txt
-          pip install pytest
+          if [ "$USE_CACHE" = "1" ]; then
+            # Ensure required packages are present; pip will use cache
+            pip install -r requirements.txt pytest || pip install -r requirements.txt pytest
+          else
+            pip install -r requirements.txt pytest
+          fi
 
       - name: Format check (black)
         run: |
@@ -84,7 +106,7 @@ jobs:
       - name: Run tests (pytest)
         run: |
           . .venv/bin/activate
-          pytest -q
+          pytest -q --maxfail=1
 
       - name: Build sample reports (no artifact upload)
         run: |

From ab4f017ba815d5b364403a87f4c41a1e866f8302 Mon Sep 17 00:00:00 2001
From: ngxstat-bot <bot@localhost>
Date: Sat, 16 Aug 2025 05:17:51 -0500
Subject: [PATCH 14/26] ci: robust venv creation; verify cached venv has
 activate and fallback to local

---
 .forgejo/workflows/ci.yml | 23 ++++++++++++++++-------
 1 file changed, 16 insertions(+), 7 deletions(-)

diff --git a/.forgejo/workflows/ci.yml b/.forgejo/workflows/ci.yml
index 2717345..cd7fb36 100644
--- a/.forgejo/workflows/ci.yml
+++ b/.forgejo/workflows/ci.yml
@@ -73,15 +73,24 @@ jobs:
             REQ_HASH=$(sha256sum requirements.txt | awk '{print $1}')
             PYVER=$(python3 -c 'import sys;print(".".join(map(str, sys.version_info[:2])))')
             CACHE_VENV="/cache/venv-${REQ_HASH}-py${PYVER}"
-            if [ -d "$CACHE_VENV" ]; then
-              echo "Using cached virtualenv: $CACHE_VENV"
-              ln -s "$CACHE_VENV" .venv
-              USE_CACHE=1
-            else
-              echo "Creating cached virtualenv: $CACHE_VENV"
+            if [ ! -f "$CACHE_VENV/bin/activate" ]; then
+              echo "Preparing cached virtualenv: $CACHE_VENV"
+              rm -rf "$CACHE_VENV" || true
               python3 -m venv "$CACHE_VENV"
-              ln -s "$CACHE_VENV" .venv
             fi
+            ln -sfn "$CACHE_VENV" .venv
+            USE_CACHE=1
+          else
+            # Fallback to local venv
+            python3 -m venv .venv
+          fi
+
+          # If the link didn't produce an activate file, fallback to local venv
+          if [ ! -f .venv/bin/activate ]; then
+            echo "Cached venv missing; creating local .venv"
+            rm -f .venv
+            python3 -m venv .venv
+            USE_CACHE=0
           fi
 
           . .venv/bin/activate

From 176359d0100b8d52370f0a154ea22a59462a4e44 Mon Sep 17 00:00:00 2001
From: ngxstat-bot <bot@localhost>
Date: Sat, 16 Aug 2025 05:19:48 -0500
Subject: [PATCH 15/26] lint: remove unused typing import; mark test pytest
 import as noqa F401

---
 scripts/analyze.py    | 2 +-
 tests/test_analyze.py | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/scripts/analyze.py b/scripts/analyze.py
index fe7b818..7c4c141 100644
--- a/scripts/analyze.py
+++ b/scripts/analyze.py
@@ -18,7 +18,7 @@ from __future__ import annotations
 
 import sqlite3
 from pathlib import Path
-from typing import Dict, List, Optional, Set
+from typing import List, Optional, Set
 from datetime import datetime, timedelta
 
 import json
diff --git a/tests/test_analyze.py b/tests/test_analyze.py
index a4358d7..138e73d 100644
--- a/tests/test_analyze.py
+++ b/tests/test_analyze.py
@@ -3,7 +3,7 @@ import json
 import sqlite3
 from pathlib import Path
 
-import pytest
+import pytest  # noqa: F401
 
 REPO_ROOT = Path(__file__).resolve().parents[1]
 sys.path.append(str(REPO_ROOT))

From 5053a4c4db726b81c614e3a647356c833ac2ff26 Mon Sep 17 00:00:00 2001
From: ngxstat-bot <bot@localhost>
Date: Sat, 16 Aug 2025 05:24:14 -0500
Subject: [PATCH 16/26] lint: re-enable E402; remove sys.path hacks; drop
 unused pytest imports in tests

---
 .flake8                    | 3 ---
 tests/test_analyze.py      | 6 ------
 tests/test_nginx_config.py | 4 ----
 tests/test_reports.py      | 8 +++-----
 4 files changed, 3 insertions(+), 18 deletions(-)

diff --git a/.flake8 b/.flake8
index 0ba73e9..95f9808 100644
--- a/.flake8
+++ b/.flake8
@@ -1,6 +1,3 @@
 [flake8]
 exclude = .git, .venv, output, static/icons
 max-line-length = 160
-per-file-ignores =
-    tests/test_*.py: E402
-
diff --git a/tests/test_analyze.py b/tests/test_analyze.py
index 138e73d..6e97ab6 100644
--- a/tests/test_analyze.py
+++ b/tests/test_analyze.py
@@ -1,12 +1,6 @@
-import sys
 import json
 import sqlite3
 from pathlib import Path
-
-import pytest  # noqa: F401
-
-REPO_ROOT = Path(__file__).resolve().parents[1]
-sys.path.append(str(REPO_ROOT))
 from scripts import analyze
 from scripts import generate_reports as gr
 
diff --git a/tests/test_nginx_config.py b/tests/test_nginx_config.py
index b2b1317..604b700 100644
--- a/tests/test_nginx_config.py
+++ b/tests/test_nginx_config.py
@@ -1,9 +1,5 @@
-import sys
 from pathlib import Path
-import pytest  # noqa: F401
 
-REPO_ROOT = Path(__file__).resolve().parents[1]
-sys.path.append(str(REPO_ROOT))
 from scripts import nginx_config as nc
 
 
diff --git a/tests/test_reports.py b/tests/test_reports.py
index fa8f0a0..f6c6918 100644
--- a/tests/test_reports.py
+++ b/tests/test_reports.py
@@ -1,14 +1,10 @@
 import sqlite3
 from pathlib import Path
 import json
-import sys
 from datetime import datetime
 
 import pytest
 from typer.testing import CliRunner
-
-REPO_ROOT = Path(__file__).resolve().parents[1]
-sys.path.append(str(REPO_ROOT))
 from scripts import generate_reports as gr
 
 
@@ -205,7 +201,9 @@ def test_generate_root_index(tmp_path, sample_reports, monkeypatch):
 def test_generated_marker_written(tmp_path, monkeypatch):
     out_dir = tmp_path / "output"
     monkeypatch.setattr(gr, "OUTPUT_DIR", out_dir)
-    monkeypatch.setattr(gr, "TEMPLATE_DIR", REPO_ROOT / "templates")
+    monkeypatch.setattr(
+        gr, "TEMPLATE_DIR", Path(__file__).resolve().parents[1] / "templates"
+    )
     monkeypatch.setattr(gr, "GENERATED_MARKER", out_dir / "generated.txt")
     monkeypatch.setattr(gr, "_copy_icons", lambda: None)
     (out_dir / "hourly").mkdir(parents=True)

From a8f7ac9b7a53fe920dbe28421a076dd4ff6fe5bf Mon Sep 17 00:00:00 2001
From: ngxstat-bot <bot@localhost>
Date: Sat, 16 Aug 2025 05:27:02 -0500
Subject: [PATCH 17/26] lint: remove unused Path import in
 tests/test_nginx_config.py

---
 tests/test_nginx_config.py | 2 --
 1 file changed, 2 deletions(-)

diff --git a/tests/test_nginx_config.py b/tests/test_nginx_config.py
index 604b700..cba4212 100644
--- a/tests/test_nginx_config.py
+++ b/tests/test_nginx_config.py
@@ -1,5 +1,3 @@
-from pathlib import Path
-
 from scripts import nginx_config as nc
 
 

From 9c26ae3e9027be613f723acac3c654504b1b702e Mon Sep 17 00:00:00 2001
From: ngxstat-bot <bot@localhost>
Date: Sat, 16 Aug 2025 05:29:20 -0500
Subject: [PATCH 18/26] ci: ensure repo root on PYTHONPATH when running pytest

---
 .forgejo/workflows/ci.yml | 1 +
 1 file changed, 1 insertion(+)

diff --git a/.forgejo/workflows/ci.yml b/.forgejo/workflows/ci.yml
index cd7fb36..5cf26be 100644
--- a/.forgejo/workflows/ci.yml
+++ b/.forgejo/workflows/ci.yml
@@ -115,6 +115,7 @@ jobs:
       - name: Run tests (pytest)
         run: |
           . .venv/bin/activate
+          export PYTHONPATH="$(pwd)${PYTHONPATH:+:$PYTHONPATH}"
           pytest -q --maxfail=1
 
       - name: Build sample reports (no artifact upload)

From fab91d2e04ef2b0fe08c15f666516a20cc11e04e Mon Sep 17 00:00:00 2001
From: ngxstat-bot <bot@ngxstat.local>
Date: Mon, 18 Aug 2025 23:01:00 -0500
Subject: [PATCH 19/26] Phase 1 UX + JS transforms: tabs, windowing,
 percent/grouping, smoothing, stacked series, metadata pass-through, top_n

- Replace tabs with Recent/Trends/Distribution/Tables/Analysis and add sticky controls (interval, domain, window [default 7d], percent, group small, exclude '-' -> Uncached, smoothing toggle).

- Client-side transforms: time-window slicing, percent mode, group others (3%), per-report exclusions; stackedBar multi-series; moving average for error_rate.

- Generator: pass through optional UX metadata (windows_supported, window_default, group_others_threshold, exclude_values, top_n, stacked, palette) and enforce top_n LIMIT for table reports.

- Reports: add status_classes_timeseries and cache_status_timeseries; apply top_n=50 to heavy tables.

- Chart manager: add helpers (sliceWindow, excludeValues, toPercent, groupOthers, movingAverage).

- URL state + localStorage for context; per-tab filtering for Trends/Distribution/Tables.
---
 reports.yml                 |  41 +++++
 scripts/generate_reports.py |  44 +++++
 static/chartManager.js      |  60 ++++++
 templates/index.html        | 356 ++++++++++++++++++++++++++++++------
 4 files changed, 442 insertions(+), 59 deletions(-)

diff --git a/reports.yml b/reports.yml
index 1ae8e6f..709d686 100644
--- a/reports.yml
+++ b/reports.yml
@@ -48,6 +48,7 @@
   label: Top Domains
   icon: globe
   chart: table
+  top_n: 50
   per_domain: false
   bucket: domain
   bucket_label: Domain
@@ -75,6 +76,7 @@
   label: Top Paths
   icon: map
   chart: table
+  top_n: 50
   buckets:
     - domain
     - path
@@ -102,6 +104,7 @@
   label: User Agents
   icon: user
   chart: table
+  top_n: 50
   buckets:
     - domain
     - user_agent
@@ -127,6 +130,7 @@
   label: Referrers
   icon: link
   chart: table
+  top_n: 50
   buckets:
     - domain
     - referrer
@@ -170,3 +174,40 @@
     - "#209cee"
     - "#ffdd57"
     - "#f14668"
+
+# New time-series: status classes over time (stacked)
+- name: status_classes_timeseries
+  label: Status Classes Over Time
+  icon: server
+  chart: stackedBar
+  bucket: time_bucket
+  bucket_label: Time
+  stacked: true
+  query: |
+    SELECT {bucket} AS time_bucket,
+           SUM(CASE WHEN status BETWEEN 200 AND 299 THEN 1 ELSE 0 END) AS "2xx",
+           SUM(CASE WHEN status BETWEEN 300 AND 399 THEN 1 ELSE 0 END) AS "3xx",
+           SUM(CASE WHEN status BETWEEN 400 AND 499 THEN 1 ELSE 0 END) AS "4xx",
+           SUM(CASE WHEN status BETWEEN 500 AND 599 THEN 1 ELSE 0 END) AS "5xx",
+           COUNT(*) AS total
+    FROM logs
+    GROUP BY time_bucket
+    ORDER BY time_bucket
+
+# New time-series: cache status over time (compact Hit/Miss; exclude '-' by default)
+- name: cache_status_timeseries
+  label: Cache Status Over Time
+  icon: archive
+  chart: stackedBar
+  bucket: time_bucket
+  bucket_label: Time
+  stacked: true
+  exclude_values: ["-"]
+  query: |
+    SELECT {bucket} AS time_bucket,
+           SUM(CASE WHEN cache_status = 'HIT' THEN 1 ELSE 0 END) AS hit,
+           SUM(CASE WHEN cache_status = 'MISS' THEN 1 ELSE 0 END) AS miss,
+           COUNT(*) AS total
+    FROM logs
+    GROUP BY time_bucket
+    ORDER BY time_bucket
diff --git a/scripts/generate_reports.py b/scripts/generate_reports.py
index a45e4eb..073e0b7 100644
--- a/scripts/generate_reports.py
+++ b/scripts/generate_reports.py
@@ -178,6 +178,16 @@ def _generate_interval(interval: str, domain: Optional[str] = None) -> None:
         name = definition["name"]
         query = definition["query"].replace("{bucket}", bucket)
         query = query.replace("FROM logs", "FROM logs_view")
+        # Apply top_n limit for tables (performance-friendly), if configured
+        top_n = definition.get("top_n")
+        chart_type = definition.get("chart", "line")
+        if top_n and chart_type == "table":
+            try:
+                n = int(top_n)
+                if "LIMIT" not in query.upper():
+                    query = f"{query}\nLIMIT {n}"
+            except Exception:
+                pass
         cur.execute(query)
         rows = cur.fetchall()
         headers = [c[0] for c in cur.description]
@@ -203,6 +213,18 @@ def _generate_interval(interval: str, domain: Optional[str] = None) -> None:
             entry["color"] = definition["color"]
         if "colors" in definition:
             entry["colors"] = definition["colors"]
+        # Optional UX metadata passthrough for frontend-only transforms
+        for key in (
+            "windows_supported",
+            "window_default",
+            "group_others_threshold",
+            "exclude_values",
+            "top_n",
+            "stacked",
+            "palette",
+        ):
+            if key in definition:
+                entry[key] = definition[key]
         _render_snippet(entry, out_dir)
         report_list.append(entry)
 
@@ -266,6 +288,16 @@ def _generate_global() -> None:
 
         name = definition["name"]
         query = definition["query"]
+        # Apply top_n limit for tables (performance-friendly), if configured
+        top_n = definition.get("top_n")
+        chart_type = definition.get("chart", "line")
+        if top_n and chart_type == "table":
+            try:
+                n = int(top_n)
+                if "LIMIT" not in query.upper():
+                    query = f"{query}\nLIMIT {n}"
+            except Exception:
+                pass
         cur.execute(query)
         rows = cur.fetchall()
         headers = [c[0] for c in cur.description]
@@ -291,6 +323,18 @@ def _generate_global() -> None:
             entry["color"] = definition["color"]
         if "colors" in definition:
             entry["colors"] = definition["colors"]
+        # Optional UX metadata passthrough for frontend-only transforms
+        for key in (
+            "windows_supported",
+            "window_default",
+            "group_others_threshold",
+            "exclude_values",
+            "top_n",
+            "stacked",
+            "palette",
+        ):
+            if key in definition:
+                entry[key] = definition[key]
         _render_snippet(entry, out_dir)
         report_list.append(entry)
 
diff --git a/static/chartManager.js b/static/chartManager.js
index 79d83fc..2f14f4f 100644
--- a/static/chartManager.js
+++ b/static/chartManager.js
@@ -47,3 +47,63 @@ export function reset(container) {
   });
   container.innerHTML = '';
 }
+
+// ---- Lightweight client-side data helpers ----
+
+// Slice last N rows from a time-ordered array
+export function sliceWindow(data, n) {
+  if (!Array.isArray(data) || n === undefined || n === null) return data;
+  if (n === 'all') return data;
+  const count = Number(n);
+  if (!Number.isFinite(count) || count <= 0) return data;
+  return data.slice(-count);
+}
+
+// Drop rows whose value at `key` appears in the `excluded` list
+export function excludeValues(data, key, excluded = []) {
+  if (!excluded || excluded.length === 0) return data;
+  const set = new Set(excluded);
+  return data.filter(row => !set.has(row[key]));
+}
+
+// Compute percentages for categorical distributions (valueKey default 'value')
+export function toPercent(data, valueKey = 'value') {
+  const total = data.reduce((s, r) => s + (Number(r[valueKey]) || 0), 0);
+  if (total <= 0) return data.map(r => ({ ...r }));
+  return data.map(r => ({ ...r, [valueKey]: (Number(r[valueKey]) || 0) * 100 / total }));
+}
+
+// Group categories with share < threshold into an 'Other' bucket.
+export function groupOthers(data, bucketKey, valueKey = 'value', threshold = 0.03, otherLabel = 'Other') {
+  if (!Array.isArray(data) || data.length === 0) return data;
+  const total = data.reduce((s, r) => s + (Number(r[valueKey]) || 0), 0);
+  if (total <= 0) return data;
+  const major = [];
+  let other = 0;
+  for (const r of data) {
+    const v = Number(r[valueKey]) || 0;
+    if (total && v / total < threshold) {
+      other += v;
+    } else {
+      major.push({ ...r });
+    }
+  }
+  if (other > 0) major.push({ [bucketKey]: otherLabel, [valueKey]: other });
+  return major;
+}
+
+// Trailing moving average over a numeric array (window ends at each index; entries that do not convert to a finite number are skipped)
+export function movingAverage(series, span = 3) {
+  const n = Math.max(1, Number(span) || 1);
+  const out = [];
+  for (let i = 0; i < series.length; i++) {
+    const start = Math.max(0, i - n + 1);
+    let sum = 0, cnt = 0;
+    for (let j = start; j <= i; j++) {
+      const v = Number(series[j]);
+      if (Number.isFinite(v)) { sum += v; cnt++; }
+    }
+    out.push(cnt ? sum / cnt : null);
+  }
+  return out;
+}
diff --git a/templates/index.html b/templates/index.html
index edb53f6..56dfd6f 100644
--- a/templates/index.html
+++ b/templates/index.html
@@ -12,14 +12,15 @@
 
     <div class="tabs is-toggle" id="report-tabs">
       <ul>
-        <li class="is-active" data-tab="overview"><a>Overview</a></li>
-        <li data-tab="all"><a>All Domains</a></li>
-        <li data-tab="domain"><a>Per Domain</a></li>
+        <li class="is-active" data-tab="recent"><a>Recent</a></li>
+        <li data-tab="trends"><a>Trends</a></li>
+        <li data-tab="distribution"><a>Distribution</a></li>
+        <li data-tab="tables"><a>Tables</a></li>
         <li data-tab="analysis"><a>Analysis</a></li>
       </ul>
     </div>
 
-    <div id="controls" class="field is-grouped mb-4">
+    <div id="controls" class="field is-grouped is-align-items-center mb-4" style="position: sticky; top: 0; background: white; z-index: 2; padding: 0.5rem 0;">
       <div id="interval-control" class="control has-icons-left is-hidden">
         <div class="select is-small">
           <select id="interval-select">
@@ -41,11 +42,43 @@
         </div>
         <span class="icon is-small is-left"><img src="icons/server.svg" alt="Domain"></span>
       </div>
+      <div id="window-control" class="control has-icons-left is-hidden">
+        <div class="select is-small">
+          <select id="window-select">
+            <option value="1h">Last 1h</option>
+            <option value="24h">Last 24h</option>
+            <option value="7d" selected>Last 7d</option>
+            <option value="30d">Last 30d</option>
+            <option value="all">All</option>
+          </select>
+        </div>
+        <span class="icon is-small is-left"><img src="icons/pulse.svg" alt="Window"></span>
+      </div>
+      <div id="smooth-control" class="control is-hidden">
+        <label class="checkbox is-small">
+          <input type="checkbox" id="smooth-toggle"> Smooth error rate
+        </label>
+      </div>
+      <div id="mode-percent-control" class="control is-hidden">
+        <label class="checkbox is-small">
+          <input type="checkbox" id="percent-toggle"> Percent mode
+        </label>
+      </div>
+      <div id="mode-group-control" class="control is-hidden">
+        <label class="checkbox is-small">
+          <input type="checkbox" id="group-toggle" checked> Group small into Other
+        </label>
+      </div>
+      <div id="exclude-uncached-control" class="control is-hidden">
+        <label class="checkbox is-small">
+          <input type="checkbox" id="exclude-uncached-toggle" checked> Exclude “-”
+        </label>
+      </div>
     </div>
 
-    <div id="overview-section">
+    <div id="recent-section">
       <div id="overview" class="box mb-5">
-        <h2 class="subtitle">Overview</h2>
+        <h2 class="subtitle">Recent</h2>
         <p>Total logs: <span id="stat-total">-</span></p>
         <p>Date range: <span id="stat-start">-</span> to <span id="stat-end">-</span></p>
         <p>Unique domains: <span id="stat-domains">-</span></p>
@@ -55,13 +88,17 @@
       <div id="overview-reports"></div>
     </div>
 
-    <div id="all-section" class="is-hidden">
-      <div id="reports-all"></div>
+    <div id="trends-section" class="is-hidden">
+      <div id="reports-trends"></div>
     </div>
 
-  <div id="domain-section" class="is-hidden">
-    <div id="reports-domain"></div>
-  </div>
+    <div id="distribution-section" class="is-hidden">
+      <div id="reports-distribution"></div>
+    </div>
+
+    <div id="tables-section" class="is-hidden">
+      <div id="reports-tables"></div>
+    </div>
 
   <div id="analysis-section" class="is-hidden">
     <div id="analysis-missing" class="box"></div>
@@ -79,22 +116,34 @@
       registerChart,
       reset,
       currentLoad,
+      sliceWindow,
+      excludeValues,
+      toPercent,
+      groupOthers,
+      movingAverage,
     } from './chartManager.js';
     const intervalSelect = document.getElementById('interval-select');
     const domainSelect = document.getElementById('domain-select');
     const intervalControl = document.getElementById('interval-control');
     const domainControl = document.getElementById('domain-control');
+    const windowControl = document.getElementById('window-control');
+    const modePercentControl = document.getElementById('mode-percent-control');
+    const modeGroupControl = document.getElementById('mode-group-control');
+    const excludeUncachedControl = document.getElementById('exclude-uncached-control');
+    const smoothControl = document.getElementById('smooth-control');
     const tabs = document.querySelectorAll('#report-tabs li');
     const sections = {
-      overview: document.getElementById('overview-section'),
-      all: document.getElementById('all-section'),
-      domain: document.getElementById('domain-section'),
+      recent: document.getElementById('recent-section'),
+      trends: document.getElementById('trends-section'),
+      distribution: document.getElementById('distribution-section'),
+      tables: document.getElementById('tables-section'),
       analysis: document.getElementById('analysis-section')
     };
     const containers = {
-      overview: document.getElementById('overview-reports'),
-      all: document.getElementById('reports-all'),
-      domain: document.getElementById('reports-domain')
+      recent: document.getElementById('overview-reports'),
+      trends: document.getElementById('reports-trends'),
+      distribution: document.getElementById('reports-distribution'),
+      tables: document.getElementById('reports-tables')
     };
     const analysisElems = {
       missing: document.getElementById('analysis-missing'),
@@ -108,9 +157,87 @@
     const generatedElem = document.getElementById('stat-generated');
     const elapsedElem = document.getElementById('stat-elapsed');
 
+    // Extra controls
+    const windowSelect = document.getElementById('window-select');
+    const percentToggle = document.getElementById('percent-toggle');
+    const groupToggle = document.getElementById('group-toggle');
+    const excludeUncachedToggle = document.getElementById('exclude-uncached-toggle');
+    const smoothToggle = document.getElementById('smooth-toggle');
+
     let currentInterval = intervalSelect.value;
     let currentDomain = domainSelect.value;
-    let currentTab = 'overview';
+    let currentTab = 'recent';
+    let currentWindow = windowSelect.value; // 1h, 24h, 7d, 30d, all
+    let modePercent = false;
+    let modeGroup = true;
+    let excludeUncached = true;
+    let smoothError = false;
+
+    function saveState() {
+      try {
+        localStorage.setItem('ngxstat-state', JSON.stringify({
+          tab: currentTab,
+          interval: currentInterval,
+          domain: currentDomain,
+          window: currentWindow,
+          percent: modePercent ? 1 : 0,
+          group: modeGroup ? 1 : 0,
+          exclude_dash: excludeUncached ? 1 : 0,
+          smooth: smoothError ? 1 : 0,
+        }));
+      } catch {}
+    }
+
+    function loadSavedState() {
+      try {
+        const s = JSON.parse(localStorage.getItem('ngxstat-state') || '{}');
+        if (s.tab) currentTab = s.tab;
+        if (s.interval) currentInterval = s.interval;
+        if (s.domain !== undefined) currentDomain = s.domain;
+        if (s.window) currentWindow = s.window;
+        if (s.percent !== undefined) modePercent = !!Number(s.percent);
+        if (s.group !== undefined) modeGroup = !!Number(s.group);
+        if (s.exclude_dash !== undefined) excludeUncached = !!Number(s.exclude_dash);
+        if (s.smooth !== undefined) smoothError = !!Number(s.smooth);
+      } catch {}
+    }
+
+    function applyURLParams() {
+      const params = new URLSearchParams(location.search);
+      if (params.get('tab')) currentTab = params.get('tab');
+      if (params.get('interval')) currentInterval = params.get('interval');
+      if (params.get('domain') !== null) currentDomain = params.get('domain') || '';
+      if (params.get('window')) currentWindow = params.get('window');
+      if (params.get('percent') !== null) modePercent = params.get('percent') === '1';
+      if (params.get('group') !== null) modeGroup = params.get('group') === '1';
+      if (params.get('exclude_dash') !== null) excludeUncached = params.get('exclude_dash') === '1';
+      if (params.get('smooth') !== null) smoothError = params.get('smooth') === '1';
+    }
+
+    function updateURL() {
+      const params = new URLSearchParams();
+      params.set('tab', currentTab);
+      params.set('interval', currentInterval);
+      if (currentDomain) params.set('domain', currentDomain);
+      params.set('window', currentWindow);
+      params.set('percent', modePercent ? '1' : '0');
+      params.set('group', modeGroup ? '1' : '0');
+      params.set('exclude_dash', excludeUncached ? '1' : '0');
+      params.set('smooth', smoothError ? '1' : '0');
+      const newUrl = `${location.pathname}?${params.toString()}`;
+      history.replaceState(null, '', newUrl);
+      saveState();
+    }
+
+    function bucketsForWindow(win, interval) {
+      switch (win) {
+        case '1h': return interval === 'hourly' ? 1 : 'all';
+        case '24h': return interval === 'hourly' ? 24 : 'all';
+        case '7d': return interval === 'daily' ? 7 : 'all';
+        case '30d': return interval === 'daily' ? 30 : 'all';
+        default: return 'all';
+      }
+    }
 
     function initReport(token, rep, base) {
       fetch(base + '/' + rep.json, { signal: token.controller.signal })
@@ -133,36 +260,92 @@
             return;
           }
 
+          // Transform pipeline (client-only)
+          let transformed = data.slice();
           const bucketField = bucketFields[0];
-          const labelsArr = data.map(x => x[bucketField]);
-          const values = data.map(x => x.value);
+          const isTimeSeries = bucketField === 'time_bucket';
+          // Exclusions (per-report) and explicit uncached toggle for cache_status
+          if (rep.exclude_values && rep.exclude_values.length) {
+            transformed = excludeValues(transformed, bucketField, rep.exclude_values);
+          }
+          if (excludeUncached && bucketField === 'cache_status') {
+            transformed = excludeValues(transformed, bucketField, ['-']);
+          }
+          // Windowing for time series
+          if (isTimeSeries) {
+            const n = bucketsForWindow(currentWindow, currentInterval);
+            transformed = sliceWindow(transformed, n);
+          }
+          // Distributions: percent + group small
+          const isDistribution = ['pie', 'polarArea', 'doughnut', 'donut'].includes(rep.chart);
+          if (isDistribution) {
+            if (modeGroup) {
+              const thr = (typeof rep.group_others_threshold === 'number') ? rep.group_others_threshold : 0.03;
+              transformed = groupOthers(transformed, bucketField, 'value', thr, 'Other');
+            }
+            if (modePercent) {
+              transformed = toPercent(transformed, 'value');
+            }
+          }
+          // Relabel '-' to 'Uncached' for cache_status distributions
+          if (bucketField === 'cache_status') {
+            transformed = transformed.map(row => ({
+              ...row,
+              [bucketField]: row[bucketField] === '-' ? 'Uncached' : row[bucketField]
+            }));
+          }
+
+          const labelsArr = transformed.map(x => x[bucketField]);
+          let values = transformed.map(x => x.value);
           const chartType = rep.chart === 'stackedBar' ? 'bar' : rep.chart;
           const options = { scales: { y: { beginAtZero: true } } };
+          let datasets = [];
           if (rep.chart === 'stackedBar') {
             options.scales.x = { stacked: true };
+            options.scales.y = options.scales.y || {};
             options.scales.y.stacked = true;
-          }
-          const dataset = {
-            label: rep.label,
-            data: values,
-            borderWidth: 1,
-            fill: rep.chart !== 'bar' && rep.chart !== 'stackedBar'
-          };
-          if (rep.colors) {
-            dataset.backgroundColor = rep.colors;
-            dataset.borderColor = rep.colors;
-          } else if (rep.color) {
-            dataset.backgroundColor = rep.color;
-            dataset.borderColor = rep.color;
+            // Build multiple series from columns (exclude bucket & total)
+            const keys = transformed.length ? Object.keys(transformed[0]).filter(k => k !== bucketField && k !== 'total') : [];
+            const palette = rep.colors || [
+              '#3273dc', '#23d160', '#ffdd57', '#ff3860', '#7957d5', '#363636'
+            ];
+            datasets = keys.map((k, i) => ({
+              label: k,
+              data: transformed.map(r => Number(r[k]) || 0),
+              backgroundColor: palette[i % palette.length],
+              borderColor: palette[i % palette.length],
+              borderWidth: 1,
+              fill: false,
+            }));
           } else {
-            dataset.backgroundColor = 'rgba(54, 162, 235, 0.5)';
-            dataset.borderColor = 'rgba(54, 162, 235, 1)';
+            const dataset = {
+              label: rep.label,
+              data: values,
+              borderWidth: 1,
+              fill: rep.chart !== 'bar' && rep.chart !== 'stackedBar'
+            };
+            if (rep.colors) {
+              dataset.backgroundColor = rep.colors;
+              dataset.borderColor = rep.colors;
+            } else if (rep.color) {
+              dataset.backgroundColor = rep.color;
+              dataset.borderColor = rep.color;
+            } else {
+              dataset.backgroundColor = 'rgba(54, 162, 235, 0.5)';
+              dataset.borderColor = 'rgba(54, 162, 235, 1)';
+            }
+            // Optional smoothing for error_rate
+            if (rep.name === 'error_rate' && smoothError) {
+              dataset.data = movingAverage(values, 3);
+              dataset.label = rep.label + ' (smoothed)';
+            }
+            datasets = [dataset];
           }
           const chart = new Chart(document.getElementById('chart-' + rep.name), {
             type: chartType,
             data: {
               labels: labelsArr,
-              datasets: [dataset]
+              datasets
             },
             options: options
           });
@@ -188,21 +371,11 @@
 
     function loadReports() {
       let path;
-      let container;
-      if (currentTab === 'overview') {
+      let container = containers[currentTab];
+      if (currentTab === 'recent') {
         path = 'global';
-        container = containers.overview;
-      } else if (currentTab === 'all') {
-        path = currentInterval;
-        container = containers.all;
       } else {
-        container = containers.domain;
-        if (!currentDomain) {
-          reset(container);
-          container.innerHTML = '<p>Select a domain</p>';
-          return;
-        }
-        path = 'domains/' + encodeURIComponent(currentDomain) + '/' + currentInterval;
+        path = currentDomain ? ('domains/' + encodeURIComponent(currentDomain) + '/' + currentInterval) : currentInterval;
       }
 
       const token = newLoad(container);
@@ -211,7 +384,15 @@
         .then(r => r.json())
         .then(reports => {
           if (token !== currentLoad) return;
-          reports.forEach(rep => {
+          const isDistributionType = t => ['pie','polarArea','doughnut','donut'].includes(t);
+          const filtered = reports.filter(rep => {
+            if (currentTab === 'recent') return true;
+            if (currentTab === 'trends') return rep.chart !== 'table' && !isDistributionType(rep.chart);
+            if (currentTab === 'distribution') return isDistributionType(rep.chart);
+            if (currentTab === 'tables') return rep.chart === 'table';
+            return true;
+          });
+          filtered.forEach(rep => {
             fetch(path + '/' + rep.html, { signal: token.controller.signal })
               .then(r => r.text())
               .then(html => {
@@ -313,9 +494,17 @@
       Object.entries(sections).forEach(([key, section]) => {
         section.classList.toggle('is-hidden', key !== name);
       });
-      intervalControl.classList.toggle('is-hidden', name === 'overview' || name === 'analysis');
-      domainControl.classList.toggle('is-hidden', name !== 'domain');
-      if (name === 'overview') {
+      const showInterval = name !== 'recent' && name !== 'analysis';
+      const showDomain = showInterval;
+      intervalControl.classList.toggle('is-hidden', !showInterval);
+      domainControl.classList.toggle('is-hidden', !showDomain);
+      windowControl.classList.toggle('is-hidden', !showInterval);
+      modePercentControl.classList.toggle('is-hidden', !showInterval);
+      modeGroupControl.classList.toggle('is-hidden', !showInterval);
+      excludeUncachedControl.classList.toggle('is-hidden', !showInterval);
+      smoothControl.classList.toggle('is-hidden', !showInterval);
+      updateURL();
+      if (name === 'recent') {
         loadStats();
       }
       if (name === 'analysis') {
@@ -328,23 +517,72 @@
     intervalSelect.addEventListener('change', () => {
       currentInterval = intervalSelect.value;
       abortLoad(currentLoad);
-      reset(containers.all);
-      reset(containers.domain);
+      Object.values(containers).forEach(reset);
+      updateURL();
       loadReports();
     });
 
     domainSelect.addEventListener('change', () => {
       currentDomain = domainSelect.value;
       abortLoad(currentLoad);
-      reset(containers.domain);
+      Object.values(containers).forEach(reset);
+      updateURL();
+      loadReports();
+    });
+
+    windowSelect.addEventListener('change', () => {
+      currentWindow = windowSelect.value;
+      abortLoad(currentLoad);
+      updateURL();
+      loadReports();
+    });
+
+    percentToggle.addEventListener('change', () => {
+      modePercent = percentToggle.checked;
+      abortLoad(currentLoad);
+      updateURL();
+      loadReports();
+    });
+
+    groupToggle.addEventListener('change', () => {
+      modeGroup = groupToggle.checked;
+      abortLoad(currentLoad);
+      updateURL();
+      loadReports();
+    });
+
+    excludeUncachedToggle.addEventListener('change', () => {
+      excludeUncached = excludeUncachedToggle.checked;
+      abortLoad(currentLoad);
+      updateURL();
+      loadReports();
+    });
+
+    smoothToggle.addEventListener('change', () => {
+      smoothError = smoothToggle.checked;
+      abortLoad(currentLoad);
+      updateURL();
       loadReports();
     });
 
     tabs.forEach(tab => {
-      tab.addEventListener('click', () => switchTab(tab.dataset.tab));
+      tab.addEventListener('click', () => {
+        switchTab(tab.dataset.tab);
+      });
     });
-
-    switchTab('overview');
+    // Initialize state (URL -> localStorage -> defaults)
+    loadSavedState();
+    applyURLParams();
+    // Sync controls
+    intervalSelect.value = currentInterval;
+    domainSelect.value = currentDomain;
+    windowSelect.value = currentWindow;
+    percentToggle.checked = modePercent;
+    groupToggle.checked = modeGroup;
+    excludeUncachedToggle.checked = excludeUncached;
+    smoothToggle.checked = smoothError;
+    // Show/hide controls based on active tab
+    switchTab(currentTab);
   </script>
 </body>
 </html>

From 6de85b7cc50536f5d13629e62bade6e8922f2292 Mon Sep 17 00:00:00 2001
From: ngxstat-bot <bot@ngxstat.local>
Date: Mon, 18 Aug 2025 23:47:23 -0500
Subject: [PATCH 20/26] UX Phase 1 follow-ups: state v2 + reset, window
 defaults + support, palette support; analysis JSON generation; tests for
 LIMIT/metadata; README updates

---
 README.md                   | 17 ++++---
 run-reports.sh              |  4 ++
 scripts/generate_reports.py | 34 ++++++++++++++
 templates/index.html        | 64 +++++++++++++++++++++-----
 tests/test_reports.py       | 90 +++++++++++++++++++++++++++++++++++++
 5 files changed, 193 insertions(+), 16 deletions(-)

diff --git a/README.md b/README.md
index f641d96..ac601fc 100644
--- a/README.md
+++ b/README.md
@@ -39,9 +39,10 @@ all intervals in one go:
 ```
 
 The script calls `scripts/generate_reports.py` internally to create hourly,
-daily, weekly and monthly reports. Per-domain reports are written under
-`output/domains/<domain>` alongside the aggregate data. Open
-`output/index.html` in a browser to view the dashboard.
+daily, weekly and monthly reports, then writes analysis JSON files used by the
+"Analysis" tab. Per-domain reports are written under `output/domains/<domain>`
+alongside the aggregate data. Open `output/index.html` in a browser to view the
+dashboard.
 
 If you prefer to run individual commands you can invoke the generator directly:
 
@@ -54,8 +55,14 @@ python scripts/generate_reports.py daily --all-domains
 
 `run-analysis.sh` executes additional utilities that examine the database for
 missing domains, caching opportunities and potential threats. The JSON output is
-saved under `output/analysis` and appears in the "Analysis" tab of the
-dashboard.
+saved under `output/analysis` and appears in the "Analysis" tab. The
+`run-reports.sh` script also generates these JSON files as part of the build.
+
+## UX Controls
+
+The dashboard defaults to a 7‑day window for time series. Your view preferences
+persist locally in the browser under the `ngxstat-state-v2` key. Use the
+"Reset view" button to clear saved state and restore defaults.
 
 ```bash
 ./run-analysis.sh
diff --git a/run-reports.sh b/run-reports.sh
index bfe736d..4556f32 100755
--- a/run-reports.sh
+++ b/run-reports.sh
@@ -42,6 +42,10 @@ python scripts/generate_reports.py daily --all-domains
 python scripts/generate_reports.py weekly --all-domains
 python scripts/generate_reports.py monthly --all-domains
 
+# Generate analysis JSON
+echo "[INFO] Generating analysis files..."
+python scripts/generate_reports.py analysis
+
 # Generate root index
 python scripts/generate_reports.py index
 
diff --git a/scripts/generate_reports.py b/scripts/generate_reports.py
index 073e0b7..178951e 100644
--- a/scripts/generate_reports.py
+++ b/scripts/generate_reports.py
@@ -344,6 +344,34 @@ def _generate_global() -> None:
     typer.echo("Generated global reports")
 
 
+def _generate_analysis() -> None:
+    """Generate analysis JSON files consumed by the Analysis tab."""
+    try:
+        # Import lazily to avoid circulars and keep dependencies optional
+        from scripts import analyze
+    except Exception as exc:  # pragma: no cover - defensive
+        typer.echo(f"Failed to import analysis module: {exc}")
+        return
+
+    # Ensure output root and icons present for parity
+    _copy_icons()
+
+    # These commands write JSON files under output/analysis/
+    try:
+        analyze.check_missing_domains(json_output=True)
+    except Exception as exc:  # pragma: no cover - continue best-effort
+        typer.echo(f"check_missing_domains failed: {exc}")
+    try:
+        analyze.suggest_cache(json_output=True)
+    except Exception as exc:  # pragma: no cover
+        typer.echo(f"suggest_cache failed: {exc}")
+    try:
+        analyze.detect_threats()
+    except Exception as exc:  # pragma: no cover
+        typer.echo(f"detect_threats failed: {exc}")
+    typer.echo("Generated analysis JSON files")
+
+
 @app.command()
 def hourly(
     domain: Optional[str] = typer.Option(
@@ -414,6 +442,12 @@ def global_reports() -> None:
     _generate_global()
 
 
+@app.command()
+def analysis() -> None:
+    """Generate analysis JSON files for the Analysis tab."""
+    _generate_analysis()
+
+
 @app.command()
 def index() -> None:
     """Generate the root index page linking all reports."""
diff --git a/templates/index.html b/templates/index.html
index 56dfd6f..5b877ef 100644
--- a/templates/index.html
+++ b/templates/index.html
@@ -74,6 +74,9 @@
           <input type="checkbox" id="exclude-uncached-toggle" checked> Exclude “-”
         </label>
       </div>
+      <div id="reset-control" class="control">
+        <button id="reset-view" class="button is-small is-light">Reset view</button>
+      </div>
     </div>
 
     <div id="recent-section">
@@ -122,6 +125,7 @@
       groupOthers,
       movingAverage,
     } from './chartManager.js';
+    const STATE_KEY = 'ngxstat-state-v2';
     const intervalSelect = document.getElementById('interval-select');
     const domainSelect = document.getElementById('domain-select');
     const intervalControl = document.getElementById('interval-control');
@@ -131,6 +135,7 @@
     const modeGroupControl = document.getElementById('mode-group-control');
     const excludeUncachedControl = document.getElementById('exclude-uncached-control');
     const smoothControl = document.getElementById('smooth-control');
+    const resetButton = document.getElementById('reset-view');
     const tabs = document.querySelectorAll('#report-tabs li');
     const sections = {
       recent: document.getElementById('recent-section'),
@@ -172,10 +177,11 @@
     let modeGroup = true;
     let excludeUncached = true;
     let smoothError = false;
+    let hadExplicitWindow = false; // URL or saved-state provided window
 
     function saveState() {
       try {
-        localStorage.setItem('ngxstat-state', JSON.stringify({
+        localStorage.setItem(STATE_KEY, JSON.stringify({
           tab: currentTab,
           interval: currentInterval,
           domain: currentDomain,
@@ -190,11 +196,11 @@
 
     function loadSavedState() {
       try {
-        const s = JSON.parse(localStorage.getItem('ngxstat-state') || '{}');
+        const s = JSON.parse(localStorage.getItem(STATE_KEY) || '{}');
         if (s.tab) currentTab = s.tab;
         if (s.interval) currentInterval = s.interval;
         if (s.domain !== undefined) currentDomain = s.domain;
-        if (s.window) currentWindow = s.window;
+        if (s.window) { currentWindow = s.window; hadExplicitWindow = true; }
         if (s.percent !== undefined) modePercent = !!Number(s.percent);
         if (s.group !== undefined) modeGroup = !!Number(s.group);
         if (s.exclude_dash !== undefined) excludeUncached = !!Number(s.exclude_dash);
@@ -207,7 +213,7 @@
       if (params.get('tab')) currentTab = params.get('tab');
       if (params.get('interval')) currentInterval = params.get('interval');
       if (params.get('domain') !== null) currentDomain = params.get('domain') || '';
-      if (params.get('window')) currentWindow = params.get('window');
+      if (params.get('window')) { currentWindow = params.get('window'); hadExplicitWindow = true; }
       if (params.get('percent') !== null) modePercent = params.get('percent') === '1';
       if (params.get('group') !== null) modeGroup = params.get('group') === '1';
       if (params.get('exclude_dash') !== null) excludeUncached = params.get('exclude_dash') === '1';
@@ -273,8 +279,13 @@
           }
           // Windowing for time series
           if (isTimeSeries) {
-            const n = bucketsForWindow(currentWindow, currentInterval);
-            transformed = sliceWindow(transformed, n);
+            // Only apply windowing if report supports current window (if constrained)
+            const supported = Array.isArray(rep.windows_supported) ? rep.windows_supported : null;
+            const canWindow = !supported || supported.includes(currentWindow);
+            if (canWindow) {
+              const n = bucketsForWindow(currentWindow, currentInterval);
+              transformed = sliceWindow(transformed, n);
+            }
           }
           // Distributions: percent + group small
           const isDistribution = ['pie', 'polarArea', 'doughnut', 'donut'].includes(rep.chart);
@@ -306,7 +317,7 @@
             options.scales.y.stacked = true;
             // Build multiple series from columns (exclude bucket & total)
             const keys = transformed.length ? Object.keys(transformed[0]).filter(k => k !== bucketField && k !== 'total') : [];
-            const palette = rep.colors || [
+            const palette = rep.colors || rep.palette || [
               '#3273dc', '#23d160', '#ffdd57', '#ff3860', '#7957d5', '#363636'
             ];
             datasets = keys.map((k, i) => ({
@@ -327,6 +338,9 @@
             if (rep.colors) {
               dataset.backgroundColor = rep.colors;
               dataset.borderColor = rep.colors;
+            } else if (rep.palette) {
+              dataset.backgroundColor = rep.palette;
+              dataset.borderColor = rep.palette;
             } else if (rep.color) {
               dataset.backgroundColor = rep.color;
               dataset.borderColor = rep.color;
@@ -392,6 +406,15 @@
             if (currentTab === 'tables') return rep.chart === 'table';
             return true;
           });
+          // If no explicit window was given (URL or saved state), honor first report's default
+          if (!hadExplicitWindow) {
+            const withDefault = filtered.find(r => r.window_default);
+            if (withDefault && typeof withDefault.window_default === 'string') {
+              currentWindow = withDefault.window_default;
+              windowSelect.value = currentWindow;
+              updateURL();
+            }
+          }
           filtered.forEach(rep => {
             fetch(path + '/' + rep.html, { signal: token.controller.signal })
               .then(r => r.text())
@@ -499,10 +522,12 @@
       intervalControl.classList.toggle('is-hidden', !showInterval);
       domainControl.classList.toggle('is-hidden', !showDomain);
       windowControl.classList.toggle('is-hidden', !showInterval);
-      modePercentControl.classList.toggle('is-hidden', !showInterval);
-      modeGroupControl.classList.toggle('is-hidden', !showInterval);
-      excludeUncachedControl.classList.toggle('is-hidden', !showInterval);
-      smoothControl.classList.toggle('is-hidden', !showInterval);
+      // Only show percent/group/exclude toggles on Distribution tab,
+      // and smoothing only on Trends tab
+      modePercentControl.classList.toggle('is-hidden', name !== 'distribution');
+      modeGroupControl.classList.toggle('is-hidden', name !== 'distribution');
+      excludeUncachedControl.classList.toggle('is-hidden', name !== 'distribution');
+      smoothControl.classList.toggle('is-hidden', name !== 'trends');
       updateURL();
       if (name === 'recent') {
         loadStats();
@@ -570,6 +595,23 @@
         switchTab(tab.dataset.tab);
       });
     });
+    resetButton.addEventListener('click', () => {
+      try {
+        localStorage.removeItem('ngxstat-state'); // clear legacy
+        localStorage.removeItem(STATE_KEY);
+      } catch {}
+      // Reset to hard defaults
+      currentTab = 'recent';
+      currentInterval = intervalSelect.value = intervalSelect.options[0]?.value || currentInterval;
+      currentDomain = domainSelect.value = '';
+      currentWindow = windowSelect.value = '7d';
+      modePercent = percentToggle.checked = false;
+      modeGroup = groupToggle.checked = true;
+      excludeUncached = excludeUncachedToggle.checked = true;
+      smoothError = smoothToggle.checked = false;
+      hadExplicitWindow = false;
+      switchTab(currentTab);
+    });
     // Initialize state (URL -> localStorage -> defaults)
     loadSavedState();
     applyURLParams();
diff --git a/tests/test_reports.py b/tests/test_reports.py
index f6c6918..60a6df6 100644
--- a/tests/test_reports.py
+++ b/tests/test_reports.py
@@ -323,3 +323,93 @@ def test_multi_bucket_table(tmp_path, monkeypatch):
     entry = next(r for r in reports if r["name"] == "multi")
     assert entry["buckets"] == ["domain", "agent"]
     assert entry["bucket_label"] == ["Domain", "Agent"]
+
+
+def test_top_n_limit_applied(tmp_path, monkeypatch):
+    # Prepare DB with many distinct agents
+    db_path = tmp_path / "database" / "ngxstat.db"
+    setup_db(db_path)
+    conn = sqlite3.connect(db_path)
+    cur = conn.cursor()
+    for i in range(10):
+        cur.execute(
+            "INSERT INTO logs (ip, host, time, request, status, bytes_sent, referer, user_agent, cache_status) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?)",
+            (
+                "127.0.0.1",
+                "example.com",
+                f"2024-01-01 11:{i:02d}:00",
+                "GET /x HTTP/1.1",
+                200,
+                100,
+                "-",
+                f"ua-{i}",
+                "MISS",
+            ),
+        )
+    conn.commit()
+    conn.close()
+
+    cfg = tmp_path / "reports.yml"
+    cfg.write_text(
+        """
+- name: agents
+  chart: table
+  global: true
+  top_n: 3
+  query: |
+    SELECT user_agent AS agent, COUNT(*) AS value
+    FROM logs
+    GROUP BY user_agent
+    ORDER BY value DESC
+"""
+    )
+
+    monkeypatch.setattr(gr, "DB_PATH", db_path)
+    monkeypatch.setattr(gr, "OUTPUT_DIR", tmp_path / "output")
+    monkeypatch.setattr(gr, "REPORT_CONFIG", cfg)
+    monkeypatch.setattr(
+        gr, "TEMPLATE_DIR", Path(__file__).resolve().parents[1] / "templates"
+    )
+
+    gr._generate_global()
+
+    data = json.loads((tmp_path / "output" / "global" / "agents.json").read_text())
+    # Should be limited to 3 rows
+    assert len(data) <= 3
+
+
+def test_metadata_passthrough(tmp_path, monkeypatch):
+    db_path = tmp_path / "database" / "ngxstat.db"
+    setup_db(db_path)
+
+    cfg = tmp_path / "reports.yml"
+    cfg.write_text(
+        """
+- name: custom_ts
+  label: Custom TS
+  chart: line
+  window_default: 24h
+  windows_supported: [1h, 24h, 7d]
+  palette: ["#111111", "#222222"]
+  query: |
+    SELECT {bucket} AS time_bucket, COUNT(*) AS value
+    FROM logs
+    GROUP BY time_bucket
+    ORDER BY time_bucket
+"""
+    )
+
+    monkeypatch.setattr(gr, "DB_PATH", db_path)
+    monkeypatch.setattr(gr, "OUTPUT_DIR", tmp_path / "output")
+    monkeypatch.setattr(gr, "REPORT_CONFIG", cfg)
+    monkeypatch.setattr(
+        gr, "TEMPLATE_DIR", Path(__file__).resolve().parents[1] / "templates"
+    )
+
+    gr._generate_interval("hourly")
+
+    reports = json.loads((tmp_path / "output" / "hourly" / "reports.json").read_text())
+    entry = next(r for r in reports if r["name"] == "custom_ts")
+    assert entry["window_default"] == "24h"
+    assert entry["windows_supported"] == ["1h", "24h", "7d"]
+    assert entry["palette"] == ["#111111", "#222222"]

From 95e54359d7cc0289655161d0f271b533f9dcf7a1 Mon Sep 17 00:00:00 2001
From: ngxstat-bot <bot@ngxstat.local>
Date: Tue, 19 Aug 2025 00:09:49 -0500
Subject: [PATCH 21/26] UX: unify time selection and simplify controls

- Replace separate Interval + Window with a single Time preset (Last
  hour/24h/7d/30d/12w/12m/All time)
- Map presets to sensible grouping (hourly/daily/weekly/monthly) based on
  available intervals
- Keep backward compatibility: preserve existing URL/state params; keep legacy
  controls hidden
- Add client support for new windows (12w, 12m) in time-bucket slicing
- Show only relevant controls per tab (Trends: smoothing; Distribution:
  percent/group/exclude)
- Streamline reset flow to a sane default (Last 7 days)

---
 templates/index.html | 133 +++++++++++++++++++++++++++++++++----------
 1 file changed, 102 insertions(+), 31 deletions(-)

diff --git a/templates/index.html b/templates/index.html
index 5b877ef..7e16527 100644
--- a/templates/index.html
+++ b/templates/index.html
@@ -21,6 +21,7 @@
     </div>
 
     <div id="controls" class="field is-grouped is-align-items-center mb-4" style="position: sticky; top: 0; background: white; z-index: 2; padding: 0.5rem 0;">
+      <!-- Hidden native interval control kept for compatibility and availability probing -->
       <div id="interval-control" class="control has-icons-left is-hidden">
         <div class="select is-small">
           <select id="interval-select">
@@ -42,17 +43,20 @@
         </div>
         <span class="icon is-small is-left"><img src="icons/server.svg" alt="Domain"></span>
       </div>
-      <div id="window-control" class="control has-icons-left is-hidden">
+      <!-- Unified Time control: selects both range and sensible grouping -->
+      <div id="time-control" class="control has-icons-left is-hidden">
         <div class="select is-small">
-          <select id="window-select">
-            <option value="1h">Last 1h</option>
-            <option value="24h">Last 24h</option>
-            <option value="7d" selected>Last 7d</option>
-            <option value="30d">Last 30d</option>
-            <option value="all">All</option>
+          <select id="time-select">
+            <option value="1h">Last hour</option>
+            <option value="24h">Last 24 hours</option>
+            <option value="7d" selected>Last 7 days</option>
+            <option value="30d">Last 30 days</option>
+            <option value="12w">Last 12 weeks</option>
+            <option value="12m">Last 12 months</option>
+            <option value="all">All time</option>
           </select>
         </div>
-        <span class="icon is-small is-left"><img src="icons/pulse.svg" alt="Window"></span>
+        <span class="icon is-small is-left"><img src="icons/clock.svg" alt="Time"></span>
       </div>
       <div id="smooth-control" class="control is-hidden">
         <label class="checkbox is-small">
@@ -130,7 +134,8 @@
     const domainSelect = document.getElementById('domain-select');
     const intervalControl = document.getElementById('interval-control');
     const domainControl = document.getElementById('domain-control');
-    const windowControl = document.getElementById('window-control');
+    const timeControl = document.getElementById('time-control');
+    const timeSelect = document.getElementById('time-select');
     const modePercentControl = document.getElementById('mode-percent-control');
     const modeGroupControl = document.getElementById('mode-group-control');
     const excludeUncachedControl = document.getElementById('exclude-uncached-control');
@@ -163,7 +168,25 @@
     const elapsedElem = document.getElementById('stat-elapsed');
 
     // Extra controls
+    // Legacy window select kept for internal state only (not shown)
     const windowSelect = document.getElementById('window-select');
+    
+    // If legacy window select is not present in DOM, create a hidden one for code paths
+    // that still reference it.
+    (function ensureHiddenWindowSelect(){
+      if (!windowSelect) {
+        const hidden = document.createElement('select');
+        hidden.id = 'window-select';
+        hidden.classList.add('is-hidden');
+        // Supported values used by code
+        ['1h','24h','7d','30d','12w','12m','all'].forEach(v => {
+          const o = document.createElement('option');
+          o.value = v; o.textContent = v;
+          hidden.appendChild(o);
+        });
+        document.body.appendChild(hidden);
+      }
+    })();
     const percentToggle = document.getElementById('percent-toggle');
     const groupToggle = document.getElementById('group-toggle');
     const excludeUncachedToggle = document.getElementById('exclude-uncached-toggle');
@@ -172,7 +195,7 @@
     let currentInterval = intervalSelect.value;
     let currentDomain = domainSelect.value;
     let currentTab = 'recent';
-    let currentWindow = windowSelect.value; // 1h, 24h, 7d, 30d, all
+    let currentWindow = windowSelect ? windowSelect.value : '7d'; // 1h, 24h, 7d, 30d, 12w, 12m, all
     let modePercent = false;
     let modeGroup = true;
     let excludeUncached = true;
@@ -241,10 +264,46 @@
         case '24h': return interval === 'hourly' ? 24 : 'all';
         case '7d': return interval === 'daily' ? 7 : 'all';
         case '30d': return interval === 'daily' ? 30 : 'all';
+        case '12w': return interval === 'weekly' ? 12 : 'all';
+        case '12m': return interval === 'monthly' ? 12 : 'all';
         default: return 'all';
       }
     }
 
+    function availableIntervals() {
+      try {
+        return Array.from(intervalSelect ? intervalSelect.options : []).map(o => o.value);
+      } catch { return []; }
+    }
+
+    function pickIntervalForWindow(win) {
+      const avail = availableIntervals();
+      const pref = (list) => list.find(x => avail.includes(x));
+      switch (win) {
+        case '1h':
+        case '24h':
+          return pref(['hourly','daily','weekly','monthly']) || (avail[0] || 'daily');
+        case '7d':
+        case '30d':
+          return pref(['daily','weekly','monthly','hourly']) || (avail[0] || 'daily');
+        case '12w':
+          return pref(['weekly','daily','monthly']) || (avail[0] || 'weekly');
+        case '12m':
+          return pref(['monthly','weekly','daily']) || (avail[0] || 'monthly');
+        default:
+          // all time: favor coarser buckets if available
+          return pref(['monthly','weekly','daily','hourly']) || (avail[0] || 'weekly');
+      }
+    }
+
+    function applyTimePreset(win) {
+      currentWindow = win;
+      currentInterval = pickIntervalForWindow(win);
+      if (intervalSelect) intervalSelect.value = currentInterval;
+      const winSel = document.getElementById('window-select');
+      if (winSel) winSel.value = currentWindow;
+    }
+
     function initReport(token, rep, base) {
       fetch(base + '/' + rep.json, { signal: token.controller.signal })
         .then(r => r.json())
@@ -517,11 +576,12 @@
       Object.entries(sections).forEach(([key, section]) => {
         section.classList.toggle('is-hidden', key !== name);
       });
-      const showInterval = name !== 'recent' && name !== 'analysis';
-      const showDomain = showInterval;
-      intervalControl.classList.toggle('is-hidden', !showInterval);
+      const showTime = name !== 'recent' && name !== 'analysis';
+      const showDomain = showTime;
+      // Always keep legacy interval control hidden; use unified time control
+      intervalControl.classList.add('is-hidden');
       domainControl.classList.toggle('is-hidden', !showDomain);
-      windowControl.classList.toggle('is-hidden', !showInterval);
+      timeControl.classList.toggle('is-hidden', !showTime);
       // Only show percent/group/exclude toggles on Distribution tab,
       // and smoothing only on Trends tab
       modePercentControl.classList.toggle('is-hidden', name !== 'distribution');
@@ -539,13 +599,15 @@
       }
     }
 
-    intervalSelect.addEventListener('change', () => {
-      currentInterval = intervalSelect.value;
-      abortLoad(currentLoad);
-      Object.values(containers).forEach(reset);
-      updateURL();
-      loadReports();
-    });
+    if (intervalSelect) {
+      intervalSelect.addEventListener('change', () => {
+        currentInterval = intervalSelect.value;
+        abortLoad(currentLoad);
+        Object.values(containers).forEach(reset);
+        updateURL();
+        loadReports();
+      });
+    }
 
     domainSelect.addEventListener('change', () => {
       currentDomain = domainSelect.value;
@@ -555,12 +617,14 @@
       loadReports();
     });
 
-    windowSelect.addEventListener('change', () => {
-      currentWindow = windowSelect.value;
-      abortLoad(currentLoad);
-      updateURL();
-      loadReports();
-    });
+    if (timeSelect) {
+      timeSelect.addEventListener('change', () => {
+        applyTimePreset(timeSelect.value);
+        abortLoad(currentLoad);
+        updateURL();
+        loadReports();
+      });
+    }
 
     percentToggle.addEventListener('change', () => {
       modePercent = percentToggle.checked;
@@ -602,9 +666,10 @@
       } catch {}
       // Reset to hard defaults
       currentTab = 'recent';
-      currentInterval = intervalSelect.value = intervalSelect.options[0]?.value || currentInterval;
+      currentInterval = intervalSelect ? (intervalSelect.value = intervalSelect.options[0]?.value || currentInterval) : currentInterval;
       currentDomain = domainSelect.value = '';
-      currentWindow = windowSelect.value = '7d';
+      applyTimePreset('7d');
+      if (timeSelect) timeSelect.value = '7d';
       modePercent = percentToggle.checked = false;
       modeGroup = groupToggle.checked = true;
       excludeUncached = excludeUncachedToggle.checked = true;
@@ -616,9 +681,15 @@
     loadSavedState();
     applyURLParams();
     // Sync controls
-    intervalSelect.value = currentInterval;
+    if (intervalSelect) intervalSelect.value = currentInterval;
     domainSelect.value = currentDomain;
-    windowSelect.value = currentWindow;
+    // Sync unified time select based on state
+    if (timeSelect) {
+      const known = new Set(['1h','24h','7d','30d','12w','12m','all']);
+      const pick = known.has(currentWindow) ? currentWindow : 'all';
+      timeSelect.value = pick;
+      applyTimePreset(pick);
+    }
     percentToggle.checked = modePercent;
     groupToggle.checked = modeGroup;
     excludeUncachedToggle.checked = excludeUncached;

From 2bfd487106314b30b49936ab7675b3791ceb8159 Mon Sep 17 00:00:00 2001
From: ngxstat-bot <bot@ngxstat.local>
Date: Tue, 19 Aug 2025 00:28:42 -0500
Subject: [PATCH 22/26] UX: merge Distribution and Tables into a single
 Breakdown tab with clear option help

- Replace separate Distribution/Tables tabs with one Breakdown tab
- Breakdown shows categorical charts and data tables together
- Add in-page help explaining Percent mode, Grouping, and Exclude '-'
- Update filtering, containers, and tab logic to target new tab
- Keep existing report JSON/HTML contracts; no server changes required

---
 templates/index.html | 43 ++++++++++++++++++++++---------------------
 1 file changed, 22 insertions(+), 21 deletions(-)

diff --git a/templates/index.html b/templates/index.html
index 7e16527..41307d7 100644
--- a/templates/index.html
+++ b/templates/index.html
@@ -14,8 +14,7 @@
       <ul>
         <li class="is-active" data-tab="recent"><a>Recent</a></li>
         <li data-tab="trends"><a>Trends</a></li>
-        <li data-tab="distribution"><a>Distribution</a></li>
-        <li data-tab="tables"><a>Tables</a></li>
+        <li data-tab="breakdown"><a>Breakdown</a></li>
         <li data-tab="analysis"><a>Analysis</a></li>
       </ul>
     </div>
@@ -64,17 +63,17 @@
         </label>
       </div>
       <div id="mode-percent-control" class="control is-hidden">
-        <label class="checkbox is-small">
+        <label class="checkbox is-small" title="Show values as a percentage of the total, instead of raw counts.">
           <input type="checkbox" id="percent-toggle"> Percent mode
         </label>
       </div>
       <div id="mode-group-control" class="control is-hidden">
-        <label class="checkbox is-small">
+        <label class="checkbox is-small" title="Combine small categories into an 'Other' slice to declutter charts.">
           <input type="checkbox" id="group-toggle" checked> Group small into Other
         </label>
       </div>
       <div id="exclude-uncached-control" class="control is-hidden">
-        <label class="checkbox is-small">
+        <label class="checkbox is-small" title="Hide uncached entries (cache status '-') from cache status distributions.">
           <input type="checkbox" id="exclude-uncached-toggle" checked> Exclude “-”
         </label>
       </div>
@@ -99,12 +98,17 @@
       <div id="reports-trends"></div>
     </div>
 
-    <div id="distribution-section" class="is-hidden">
-      <div id="reports-distribution"></div>
-    </div>
-
-    <div id="tables-section" class="is-hidden">
-      <div id="reports-tables"></div>
+    <div id="breakdown-section" class="is-hidden">
+      <div class="box mb-4">
+        <h2 class="subtitle">Breakdown</h2>
+        <p class="mb-2">Explore categorical distributions and detailed lists side-by-side. Use the options below to adjust how categories are shown.</p>
+        <ul style="margin-left: 1.2rem; list-style: disc;">
+          <li><strong>Percent mode</strong>: converts counts into percentages of the total for easier comparison.</li>
+          <li><strong>Group small into Other</strong>: combines tiny slices under a single “Other” category to declutter charts.</li>
+          <li><strong>Exclude “-”</strong>: hides uncached entries (cache status “-”) from cache status distributions.</li>
+        </ul>
+      </div>
+      <div id="reports-breakdown"></div>
     </div>
 
   <div id="analysis-section" class="is-hidden">
@@ -145,15 +149,13 @@
     const sections = {
       recent: document.getElementById('recent-section'),
       trends: document.getElementById('trends-section'),
-      distribution: document.getElementById('distribution-section'),
-      tables: document.getElementById('tables-section'),
+      breakdown: document.getElementById('breakdown-section'),
       analysis: document.getElementById('analysis-section')
     };
     const containers = {
       recent: document.getElementById('overview-reports'),
       trends: document.getElementById('reports-trends'),
-      distribution: document.getElementById('reports-distribution'),
-      tables: document.getElementById('reports-tables')
+      breakdown: document.getElementById('reports-breakdown')
     };
     const analysisElems = {
       missing: document.getElementById('analysis-missing'),
@@ -461,8 +463,7 @@
           const filtered = reports.filter(rep => {
             if (currentTab === 'recent') return true;
             if (currentTab === 'trends') return rep.chart !== 'table' && !isDistributionType(rep.chart);
-            if (currentTab === 'distribution') return isDistributionType(rep.chart);
-            if (currentTab === 'tables') return rep.chart === 'table';
+            if (currentTab === 'breakdown') return isDistributionType(rep.chart) || rep.chart === 'table';
             return true;
           });
           // If no explicit window was given (URL or saved state), honor first report's default
@@ -582,11 +583,11 @@
       intervalControl.classList.add('is-hidden');
       domainControl.classList.toggle('is-hidden', !showDomain);
       timeControl.classList.toggle('is-hidden', !showTime);
-      // Only show percent/group/exclude toggles on Distribution tab,
+      // Only show percent/group/exclude toggles on Breakdown tab,
       // and smoothing only on Trends tab
-      modePercentControl.classList.toggle('is-hidden', name !== 'distribution');
-      modeGroupControl.classList.toggle('is-hidden', name !== 'distribution');
-      excludeUncachedControl.classList.toggle('is-hidden', name !== 'distribution');
+      modePercentControl.classList.toggle('is-hidden', name !== 'breakdown');
+      modeGroupControl.classList.toggle('is-hidden', name !== 'breakdown');
+      excludeUncachedControl.classList.toggle('is-hidden', name !== 'breakdown');
       smoothControl.classList.toggle('is-hidden', name !== 'trends');
       updateURL();
       if (name === 'recent') {

From 8eec623c9274c198c5e7811fb9c894f969d29694 Mon Sep 17 00:00:00 2001
From: ngxstat-bot <bot@ngxstat.local>
Date: Tue, 19 Aug 2025 00:36:41 -0500
Subject: [PATCH 23/26] reports: use timezone-aware UTC for timestamps

- Replace deprecated datetime.utcnow() with datetime.now(timezone.utc)
- Keeps existing human-friendly format while avoiding deprecation warnings
- Applies to marker file and generated_at in stats

---
 scripts/generate_reports.py | 8 +++++---
 1 file changed, 5 insertions(+), 3 deletions(-)

diff --git a/scripts/generate_reports.py b/scripts/generate_reports.py
index 178951e..118d2dc 100644
--- a/scripts/generate_reports.py
+++ b/scripts/generate_reports.py
@@ -3,7 +3,7 @@ import sqlite3
 from pathlib import Path
 import shutil
 from typing import List, Dict, Optional
-from datetime import datetime
+from datetime import datetime, timezone
 import time
 
 import yaml
@@ -37,7 +37,8 @@ def _cli_callback(ctx: typer.Context) -> None:
 
     def _write_marker() -> None:
         OUTPUT_DIR.mkdir(parents=True, exist_ok=True)
-        timestamp = datetime.utcnow().strftime("%Y-%m-%d %H:%M:%S")
+        # Use timezone-aware UTC to avoid deprecation warnings and ambiguity
+        timestamp = datetime.now(timezone.utc).strftime("%Y-%m-%d %H:%M:%S")
         GENERATED_MARKER.write_text(f"{timestamp}\n")
 
     ctx.call_on_close(_write_marker)
@@ -271,7 +272,8 @@ def _generate_global() -> None:
         return
 
     start_time = time.time()
-    generated_at = datetime.utcnow().strftime("%Y-%m-%d %H:%M:%S")
+    # Use timezone-aware UTC for generated_at (string remains unchanged format)
+    generated_at = datetime.now(timezone.utc).strftime("%Y-%m-%d %H:%M:%S")
 
     _copy_icons()
 

From f0ed112626151ae2e6f50a230b467307c67c5dc1 Mon Sep 17 00:00:00 2001
From: ngxstat-bot <bot@ngxstat.local>
Date: Tue, 19 Aug 2025 00:40:07 -0500
Subject: [PATCH 24/26] reports: fix analysis import error when run as a
 script\n\n- Prepend project root to sys.path in scripts/generate_reports.py
 to allow `scripts.*` imports when executed via path\n- Update
 run-reports.sh to invoke the generator as a module
 (`python -m scripts.generate_reports`) for robust imports\n- Keeps CLI
 behavior the same while eliminating 'No module named scripts'

---
 run-reports.sh              | 22 +++++++++++-----------
 scripts/generate_reports.py |  6 ++++++
 2 files changed, 17 insertions(+), 11 deletions(-)

diff --git a/run-reports.sh b/run-reports.sh
index 4556f32..f7cffba 100755
--- a/run-reports.sh
+++ b/run-reports.sh
@@ -29,25 +29,25 @@ fi
 
 # Generate reports for all domains combined
 echo "[INFO] Generating aggregate reports..."
-python scripts/generate_reports.py hourly
-python scripts/generate_reports.py daily
-python scripts/generate_reports.py weekly
-python scripts/generate_reports.py monthly
-python scripts/generate_reports.py global
+python -m scripts.generate_reports hourly
+python -m scripts.generate_reports daily
+python -m scripts.generate_reports weekly
+python -m scripts.generate_reports monthly
+python -m scripts.generate_reports global
 
 # Generate reports for each individual domain
 echo "[INFO] Generating per-domain reports..."
-python scripts/generate_reports.py hourly --all-domains
-python scripts/generate_reports.py daily --all-domains
-python scripts/generate_reports.py weekly --all-domains
-python scripts/generate_reports.py monthly --all-domains
+python -m scripts.generate_reports hourly --all-domains
+python -m scripts.generate_reports daily --all-domains
+python -m scripts.generate_reports weekly --all-domains
+python -m scripts.generate_reports monthly --all-domains
 
 # Generate analysis JSON
 echo "[INFO] Generating analysis files..."
-python scripts/generate_reports.py analysis
+python -m scripts.generate_reports analysis
 
 # Generate root index
-python scripts/generate_reports.py index
+python -m scripts.generate_reports index
 
 # Deactivate to keep cron environment clean
 if type deactivate >/dev/null 2>&1; then
diff --git a/scripts/generate_reports.py b/scripts/generate_reports.py
index 118d2dc..d3c2f8a 100644
--- a/scripts/generate_reports.py
+++ b/scripts/generate_reports.py
@@ -1,4 +1,5 @@
 import json
+import sys
 import sqlite3
 from pathlib import Path
 import shutil
@@ -11,6 +12,11 @@ import yaml
 import typer
 from jinja2 import Environment, FileSystemLoader
 
+# Ensure project root is importable when running as a script (python scripts/generate_reports.py)
+PROJECT_ROOT = Path(__file__).resolve().parent.parent
+if str(PROJECT_ROOT) not in sys.path:
+    sys.path.insert(0, str(PROJECT_ROOT))
+
 DB_PATH = Path("database/ngxstat.db")
 OUTPUT_DIR = Path("output")
 TEMPLATE_DIR = Path("templates")

From 359d69c3e9beeac935a4c7d2677f70b2b97538e6 Mon Sep 17 00:00:00 2001
From: ngxstat-bot <bot@ngxstat.local>
Date: Tue, 19 Aug 2025 00:48:32 -0500
Subject: [PATCH 25/26] Recent: place Cache Status and HTTP Statuses
 side-by-side in a single row\n\n- Add a Bulma columns row in Recent
 section\n- Route the two key distribution charts into two half-width
 columns\n- Leave other global reports stacked below as before

---
 templates/index.html | 18 +++++++++++++++++-
 1 file changed, 17 insertions(+), 1 deletion(-)

diff --git a/templates/index.html b/templates/index.html
index 41307d7..a5de3db 100644
--- a/templates/index.html
+++ b/templates/index.html
@@ -91,6 +91,8 @@
         <p>Last generated: <span id="stat-generated">-</span></p>
         <p>Generation time: <span id="stat-elapsed">-</span> seconds</p>
       </div>
+      <!-- Two key distributions side-by-side on Recent -->
+      <div id="recent-row" class="columns"></div>
       <div id="overview-reports"></div>
     </div>
 
@@ -157,6 +159,7 @@
       trends: document.getElementById('reports-trends'),
       breakdown: document.getElementById('reports-breakdown')
     };
+    const recentRow = document.getElementById('recent-row');
     const analysisElems = {
       missing: document.getElementById('analysis-missing'),
       cache: document.getElementById('analysis-cache'),
@@ -453,6 +456,11 @@
         path = currentDomain ? ('domains/' + encodeURIComponent(currentDomain) + '/' + currentInterval) : currentInterval;
       }
 
+      // Clear the top row on each load of Recent
+      if (currentTab === 'recent' && recentRow) {
+        recentRow.innerHTML = '';
+      }
+
       const token = newLoad(container);
 
       fetch(path + '/reports.json', { signal: token.controller.signal })
@@ -480,7 +488,15 @@
               .then(r => r.text())
               .then(html => {
                 if (token !== currentLoad) return;
-                container.insertAdjacentHTML('beforeend', html);
+                // On Recent tab, render Cache Status and HTTP Statuses side-by-side
+                const inTopRow = currentTab === 'recent' &&
+                  (rep.name === 'cache_status_breakdown' || rep.name === 'status_distribution');
+                if (inTopRow && recentRow) {
+                  const wrapped = `<div class="column is-half">${html}</div>`;
+                  recentRow.insertAdjacentHTML('beforeend', wrapped);
+                } else {
+                  container.insertAdjacentHTML('beforeend', html);
+                }
                 initReport(token, rep, path);
               });
           });

From 371719799192a775c91c5be1c71a40a50dcbb243 Mon Sep 17 00:00:00 2001
From: ngxstat-bot <bot@ngxstat.local>
Date: Tue, 19 Aug 2025 00:51:10 -0500
Subject: [PATCH 26/26] analysis: make suggest_cache and detect_threats
 pure-callable, add CLI wrappers\n\n- Replace Typer Option defaults with plain
 Python defaults in functions used by generator/tests\n- Add CLI wrapper
 commands (`suggest_cache_cli`, `detect_threats_cli`) that delegate to the
 pure functions\n- Cast params to int for SQL/timedelta to avoid type
 issues\n- Resolves OptionInfo errors during run-reports analysis phase

---
 scripts/analyze.py | 32 +++++++++++++++++++++++---------
 1 file changed, 23 insertions(+), 9 deletions(-)

diff --git a/scripts/analyze.py b/scripts/analyze.py
index 7c4c141..9f49978 100644
--- a/scripts/analyze.py
+++ b/scripts/analyze.py
@@ -155,10 +155,9 @@ def check_missing_domains(
             typer.echo(d)
 
 
-@app.command("suggest-cache")
 def suggest_cache(
-    threshold: int = typer.Option(10, help="Minimum number of MISS entries to report"),
-    json_output: bool = typer.Option(False, "--json", help="Output results as JSON"),
+    threshold: int = 10,
+    json_output: bool = False,
 ) -> None:
     """Suggest domain/path pairs that could benefit from caching.
 
@@ -191,7 +190,7 @@ def suggest_cache(
         HAVING miss_count >= ?
         ORDER BY miss_count DESC
         """,
-        (threshold,),
+        (int(threshold),),
     )
 
     rows = [r for r in cur.fetchall() if r[0] in no_cache]
@@ -211,11 +210,18 @@ def suggest_cache(
         for item in result:
             typer.echo(f"{item['host']} {item['path']} {item['misses']}")
 
+@app.command("suggest-cache")
+def suggest_cache_cli(
+    threshold: int = typer.Option(10, help="Minimum number of MISS entries to report"),
+    json_output: bool = typer.Option(False, "--json", help="Output results as JSON"),
+) -> None:
+    """CLI wrapper for suggest_cache."""
+    suggest_cache(threshold=threshold, json_output=json_output)
+
 
-@app.command("detect-threats")
 def detect_threats(
-    hours: int = typer.Option(1, help="Number of recent hours to analyze"),
-    ip_threshold: int = typer.Option(100, help="Requests from a single IP to flag"),
+    hours: int = 1,
+    ip_threshold: int = 100,
 ) -> None:
     """Detect potential security threats from recent logs."""
 
@@ -231,8 +237,8 @@ def detect_threats(
 
     max_dt = datetime.strptime(row[0], "%Y-%m-%d %H:%M:%S")
     recent_end = max_dt
-    recent_start = recent_end - timedelta(hours=hours)
-    prev_start = recent_start - timedelta(hours=hours)
+    recent_start = recent_end - timedelta(hours=int(hours))
+    prev_start = recent_start - timedelta(hours=int(hours))
     prev_end = recent_start
 
     fmt = "%Y-%m-%d %H:%M:%S"
@@ -339,6 +345,14 @@ def detect_threats(
     out_path.write_text(json.dumps(report, indent=2))
     typer.echo(json.dumps(report))
 
+@app.command("detect-threats")
+def detect_threats_cli(
+    hours: int = typer.Option(1, help="Number of recent hours to analyze"),
+    ip_threshold: int = typer.Option(100, help="Requests from a single IP to flag"),
+) -> None:
+    """CLI wrapper for detect_threats."""
+    detect_threats(hours=hours, ip_threshold=ip_threshold)
+
 
 if __name__ == "__main__":
     app()