il y a 1 semaine · 8e4f815b37
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
--- a/backend/app/core/database.py
+++ b/backend/app/core/database.py
@@ -2519,6 +2519,78 @@ async def run_migrations(conn):
 
															         conn, "CREATE INDEX IF NOT EXISTS ix_print_log_entries_archive_id ON print_log_entries (archive_id)"
														
 
															     )
														
 
															+    # Backfill PrintLogEntry → PrintArchive linkage and per-event cost/energy
														
 
															+    # for pre-#1378 rows the column-add migration left NULL (#1390).
														
 
															+    #
														
 
															+    # Without this backfill the user's Quick Stats show Filament Cost = 0 and
														
 
															+    # Time Accuracy empty even though their archives carry both, because:
														
 
															+    #
														
 
															+    #   - the new stats queries SUM PrintLogEntry.cost (NULL for old rows)
														
 
															+    #   - the time-accuracy query JOINs PrintArchive ON archive_id (NULL for
														
 
															+    #     old rows, so old runs get excluded from the average)
														
 
															+    #
														
 
															+    # Pre-#1378, archive.cost / energy_kwh / energy_cost were overwritten by
														
 
															+    # each rerun, so the current archive values represent the *latest* run.
														
 
															+    # Backfilling them onto the latest matching PrintLogEntry per archive
														
 
															+    # reconstructs the pre-fix total exactly (sum across archives stays
														
 
															+    # unchanged), and leaves earlier reprints with NULL cost so they
														
 
															+    # contribute zero — matching the "first/latest writes, rest stay NULL"
														
 
															+    # convention #1378 introduced for new prints.
														
 
															+    #
														
 
															+    # DML, not DDL — use conn.execute() inside a savepoint per _safe_execute's
														
 
															+    # own docstring. SQL is plain ANSI (correlated UPDATE, MAX/GROUP BY/HAVING,
														
 
															+    # CASE in HAVING) and runs unchanged on SQLite + PostgreSQL; verified
														
 
															+    # against postgres:16-alpine + asyncpg.
														
 
															+    #
														
 
															+    # Step 1: link old log entries to their archive via print_name + printer_id.
														
 
															+    # Picks the highest-id matching archive when multiple share the same key
														
 
															+    # (newest archive wins — closest to the log's overwrite-then-leave shape).
														
 
															+    from sqlalchemy import text as _text
														
 
															+
														
 
															+    async with conn.begin_nested():
														
 
															+        await conn.execute(
														
 
															+            _text("""
														
 
															+            UPDATE print_log_entries
														
 
															+            SET archive_id = (
														
 
															+                SELECT a.id
														
 
															+                FROM print_archives a
														
 
															+                WHERE a.print_name = print_log_entries.print_name
														
 
															+                  AND (
														
 
															+                      a.printer_id = print_log_entries.printer_id
														
 
															+                      OR (a.printer_id IS NULL AND print_log_entries.printer_id IS NULL)
														
 
															+                  )
														
 
															+                ORDER BY a.id DESC
														
 
															+                LIMIT 1
														
 
															+            )
														
 
															+            WHERE archive_id IS NULL AND print_name IS NOT NULL
														
 
															+            """)
														
 
															+        )
														
 
															+
														
 
															+    # Step 2: backfill cost / energy_kwh / energy_cost onto the latest linked
														
 
															+    # log entry per archive — the row whose creation time best matches the
														
 
															+    # value currently stored on the archive (overwrite-on-reprint semantics
														
 
															+    # under the old design). Only fires for archives where NO log entry has
														
 
															+    # cost set yet, which gives the migration a clean idempotency property:
														
 
															+    # the second pass sees the archive already has a cost-bearing run and
														
 
															+    # leaves the rest of its history NULL (instead of marching up the
														
 
															+    # ID-ordered list of NULL runs on every pass).
														
 
															+    async with conn.begin_nested():
														
 
															+        await conn.execute(
														
 
															+            _text("""
														
 
															+            UPDATE print_log_entries
														
 
															+            SET cost = (SELECT cost FROM print_archives WHERE id = print_log_entries.archive_id),
														
 
															+                energy_kwh = (SELECT energy_kwh FROM print_archives WHERE id = print_log_entries.archive_id),
														
 
															+                energy_cost = (SELECT energy_cost FROM print_archives WHERE id = print_log_entries.archive_id)
														
 
															+            WHERE id IN (
														
 
															+                SELECT MAX(id)
														
 
															+                FROM print_log_entries
														
 
															+                WHERE archive_id IS NOT NULL
														
 
															+                GROUP BY archive_id
														
 
															+                HAVING SUM(CASE WHEN cost IS NOT NULL THEN 1 ELSE 0 END) = 0
														
 
															+            )
														
 
															+            """)
														
 
															+        )
														
 
															+
														
 
															 async def seed_notification_templates():
														
 
															     """Seed default notification templates if they don't exist."""
														
--- a/backend/tests/unit/test_print_log_backfill_migration.py
+++ b/backend/tests/unit/test_print_log_backfill_migration.py
@@ -0,0 +1,247 @@
 
															+"""Regression test for the PrintLogEntry → PrintArchive backfill migration (#1390).
														
 
															+
														
 
															+Reporter IndividualGhost1905 upgraded to 0.2.4.1 (which shipped the per-event
														
 
															+aggregation rewrite from #1378) and saw Quick Stats partially break on old
														
 
															+data:
														
 
															+
														
 
															+  - Total Filament Cost = 0 (PrintLogEntry.cost was NULL on pre-upgrade rows)
														
 
															+  - Time Accuracy empty for pre-upgrade runs (the new query JOINs on
														
 
															+    archive_id, which the column-add migration left NULL)
														
 
															+
														
 
															+#1378's migration added the columns but didn't backfill anything. This test
														
 
															+pins the backfill that the same `run_migrations` pass now performs:
														
 
															+
														
 
															+  Step 1: link old log entries to their archive via print_name + printer_id.
														
 
															+  Step 2: copy archive.cost / energy_kwh / energy_cost onto the latest
														
 
															+          matching log entry per archive (so the sum across archives
														
 
															+          reproduces the pre-fix total exactly — pre-#1378, archive.cost
														
 
															+          held the LATEST run's value because reprints overwrote it).
														
 
															+
														
 
															+Earlier reprints stay with cost = NULL — matching #1378's "first/latest run
														
 
															+writes, the rest stay NULL" convention for new prints, so reruns don't
														
 
															+double-count.
														
 
															+"""
														
 
															+
														
 
															+from __future__ import annotations
														
 
															+
														
 
															+from datetime import datetime, timedelta, timezone
														
 
															+
														
 
															+import pytest
														
 
															+from sqlalchemy import text
														
 
															+from sqlalchemy.ext.asyncio import create_async_engine
														
 
															+
														
 
															+from backend.app.core.database import run_migrations
														
 
															+
														
 
															+
														
 
															+@pytest.fixture(autouse=True)
														
 
															+def force_sqlite_dialect(monkeypatch):
														
 
															+    """Force the SQLite branch in run_migrations regardless of test env settings."""
														
 
															+    from backend.app.core import db_dialect
														
 
															+
														
 
															+    monkeypatch.setattr(db_dialect, "is_sqlite", lambda: True)
														
 
															+    monkeypatch.setattr(db_dialect, "is_postgres", lambda: False)
														
 
															+    from backend.app.core import database as database_module
														
 
															+
														
 
															+    monkeypatch.setattr(database_module, "is_sqlite", lambda: True)
														
 
															+
														
 
															+
														
 
															+def _register_all_models():
														
 
															+    """Import every model so Base.metadata knows the full schema."""
														
 
															+    from backend.app.models import (  # noqa: F401
														
 
															+        ams_history,
														
 
															+        ams_label,
														
 
															+        api_key,
														
 
															+        archive,
														
 
															+        color_catalog,
														
 
															+        external_link,
														
 
															+        filament,
														
 
															+        group,
														
 
															+        kprofile_note,
														
 
															+        maintenance,
														
 
															+        notification,
														
 
															+        notification_template,
														
 
															+        print_log,
														
 
															+        print_queue,
														
 
															+        printer,
														
 
															+        project,
														
 
															+        project_bom,
														
 
															+        settings,
														
 
															+        slot_preset,
														
 
															+        smart_plug,
														
 
															+        smart_plug_energy_snapshot,
														
 
															+        spool,
														
 
															+        spool_assignment,
														
 
															+        spool_catalog,
														
 
															+        spool_k_profile,
														
 
															+        spool_usage_history,
														
 
															+        spoolbuddy_device,
														
 
															+        user,
														
 
															+        user_email_pref,
														
 
															+        virtual_printer,
														
 
															+    )
														
 
															+
														
 
															+
														
 
															+@pytest.fixture
														
 
															+async def engine_with_legacy_data():
														
 
															+    """Fresh schema + a legacy-shape dataset: two archives, four PrintLogEntry
														
 
															+    rows. The cube.3mf archive carries cost+energy (the user's reprinted file);
														
 
															+    gear.3mf has neither set. Three matching log entries simulate cube's
														
 
															+    reprint history (status: failed → completed → completed). All log entries
														
 
															+    start with archive_id and cost = NULL, exactly like the column-add
														
 
															+    migration leaves on a pre-#1378 install."""
														
 
															+    from sqlalchemy.ext.asyncio import async_sessionmaker
														
 
															+
														
 
															+    from backend.app.core.database import Base
														
 
															+    from backend.app.models.archive import PrintArchive
														
 
															+
														
 
															+    _register_all_models()
														
 
															+
														
 
															+    engine = create_async_engine("sqlite+aiosqlite:///:memory:", echo=False)
														
 
															+    async with engine.begin() as conn:
														
 
															+        await conn.run_sync(Base.metadata.create_all)
														
 
															+
														
 
															+    SessionLocal = async_sessionmaker(engine, expire_on_commit=False)
														
 
															+    async with SessionLocal() as session:
														
 
															+        session.add(
														
 
															+            PrintArchive(
														
 
															+                id=1,
														
 
															+                filename="cube.3mf",
														
 
															+                file_path="/x/cube.3mf",
														
 
															+                file_size=100,
														
 
															+                print_name="cube.3mf",
														
 
															+                printer_id=1,
														
 
															+                cost=4.25,
														
 
															+                energy_kwh=0.42,
														
 
															+                energy_cost=0.063,
														
 
															+                status="completed",
														
 
															+            )
														
 
															+        )
														
 
															+        session.add(
														
 
															+            PrintArchive(
														
 
															+                id=2,
														
 
															+                filename="gear.3mf",
														
 
															+                file_path="/x/gear.3mf",
														
 
															+                file_size=100,
														
 
															+                print_name="gear.3mf",
														
 
															+                printer_id=1,
														
 
															+                status="completed",
														
 
															+            )
														
 
															+        )
														
 
															+        await session.commit()
														
 
															+
														
 
															+    async with engine.begin() as conn:
														
 
															+        # Three log entries for cube.3mf (two early reprints + a latest run),
														
 
															+        # one for gear.3mf. All with archive_id and cost NULL — exactly the
														
 
															+        # state the column-add migration leaves on pre-#1378 installs.
														
 
															+        base = datetime.now(timezone.utc) - timedelta(days=10)
														
 
															+        for i, (delta_days, status, print_name) in enumerate(
														
 
															+            [
														
 
															+                (0, "failed", "cube.3mf"),
														
 
															+                (1, "completed", "cube.3mf"),
														
 
															+                (2, "completed", "cube.3mf"),  # latest run for cube — must receive backfill
														
 
															+                (3, "completed", "gear.3mf"),
														
 
															+            ],
														
 
															+            start=1,
														
 
															+        ):
														
 
															+            ts = (base + timedelta(days=delta_days)).isoformat()
														
 
															+            await conn.execute(
														
 
															+                text("""
														
 
															+                    INSERT INTO print_log_entries
														
 
															+                        (id, print_name, printer_id, status, started_at, completed_at,
														
 
															+                         duration_seconds, filament_used_grams, created_at)
														
 
															+                    VALUES (:id, :pn, 1, :status, :ts, :ts, 3600, 25.0, :ts)
														
 
															+                """),
														
 
															+                {"id": i, "pn": print_name, "status": status, "ts": ts},
														
 
															+            )
														
 
															+
														
 
															+        # Force NULL on the columns we want the migration to touch — the
														
 
															+        # CREATE TABLE from Base.metadata.create_all already left them NULL,
														
 
															+        # but we set explicitly so the fixture's intent is loud.
														
 
															+        await conn.execute(
														
 
															+            text("UPDATE print_log_entries SET archive_id = NULL, cost = NULL, energy_kwh = NULL, energy_cost = NULL")
														
 
															+        )
														
 
															+
														
 
															+    yield engine
														
 
															+    await engine.dispose()
														
 
															+
														
 
															+
														
 
															+async def test_backfill_links_log_entries_to_their_archive(engine_with_legacy_data):
														
 
															+    """All four entries should pick up archive_id after the migration runs."""
														
 
															+    async with engine_with_legacy_data.begin() as conn:
														
 
															+        await run_migrations(conn)
														
 
															+
														
 
															+    async with engine_with_legacy_data.connect() as conn:
														
 
															+        result = await conn.execute(text("SELECT id, print_name, archive_id FROM print_log_entries ORDER BY id"))
														
 
															+        rows = result.all()
														
 
															+
														
 
															+    assert rows == [
														
 
															+        (1, "cube.3mf", 1),
														
 
															+        (2, "cube.3mf", 1),
														
 
															+        (3, "cube.3mf", 1),
														
 
															+        (4, "gear.3mf", 2),
														
 
															+    ]
														
 
															+
														
 
															+
														
 
															+async def test_backfill_copies_cost_and_energy_to_latest_run_only(engine_with_legacy_data):
														
 
															+    """Pre-#1378 archive.cost = LAST run's value because reprints overwrote it.
														
 
															+    The backfill attributes that cost to the latest matching log entry; earlier
														
 
															+    runs stay NULL so summing across runs reproduces sum-of-archive-costs
														
 
															+    exactly — what the user saw before the upgrade."""
														
 
															+    async with engine_with_legacy_data.begin() as conn:
														
 
															+        await run_migrations(conn)
														
 
															+
														
 
															+    async with engine_with_legacy_data.connect() as conn:
														
 
															+        result = await conn.execute(text("SELECT id, cost, energy_kwh, energy_cost FROM print_log_entries ORDER BY id"))
														
 
															+        rows = result.all()
														
 
															+
														
 
															+    # Two earlier cube runs (id 1, 2): cost stays NULL.
														
 
															+    assert rows[0] == (1, None, None, None)
														
 
															+    assert rows[1] == (2, None, None, None)
														
 
															+    # Latest cube run (id 3): receives archive 1's cost / energy.
														
 
															+    assert rows[2] == (3, 4.25, 0.42, 0.063)
														
 
															+    # gear run (id 4): archive 2 has no cost/energy so log stays NULL too.
														
 
															+    assert rows[3] == (4, None, None, None)
														
 
															+
														
 
															+
														
 
															+async def test_backfill_is_idempotent(engine_with_legacy_data):
														
 
															+    """Running the migration twice produces the same state — no double-backfill,
														
 
															+    no values pulled off rows the second pass would mistakenly treat as 'new'."""
														
 
															+    async with engine_with_legacy_data.begin() as conn:
														
 
															+        await run_migrations(conn)
														
 
															+    async with engine_with_legacy_data.begin() as conn:
														
 
															+        await run_migrations(conn)
														
 
															+
														
 
															+    async with engine_with_legacy_data.connect() as conn:
														
 
															+        result = await conn.execute(text("SELECT id, archive_id, cost FROM print_log_entries ORDER BY id"))
														
 
															+        rows = result.all()
														
 
															+
														
 
															+    assert rows == [
														
 
															+        (1, 1, None),
														
 
															+        (2, 1, None),
														
 
															+        (3, 1, 4.25),
														
 
															+        (4, 2, None),
														
 
															+    ]
														
 
															+
														
 
															+
														
 
															+async def test_backfill_skips_archives_with_any_costed_run(engine_with_legacy_data):
														
 
															+    """If ANY log entry for an archive already has cost set — e.g. the post-#1378
														
 
															+    live write path filled it for a new run — the backfill leaves the entire
														
 
															+    archive alone. This is the migration's idempotency anchor: 'cost is
														
 
															+    accounted for somewhere on this archive's history' is the signal we use
														
 
															+    to decide whether to inject the archive-level value. Backfilling another
														
 
															+    row would double-count once the live writes start adding up."""
														
 
															+    async with engine_with_legacy_data.begin() as conn:
														
 
															+        # Pretend run #1 was written post-fix with its own cost.
														
 
															+        await conn.execute(text("UPDATE print_log_entries SET cost = 1.11 WHERE id = 1"))
														
 
															+        await run_migrations(conn)
														
 
															+
														
 
															+    async with engine_with_legacy_data.connect() as conn:
														
 
															+        result = await conn.execute(text("SELECT id, cost FROM print_log_entries ORDER BY id"))
														
 
															+        rows = result.all()
														
 
															+
														
 
															+    # Run #1 keeps its live-written cost. The archive already has a costed
														
 
															+    # run, so the migration does NOT inject archive.cost onto run #3.
														
 
															+    # gear.3mf (archive 2) still has nothing — but archive.cost is NULL
														
 
															+    # there too, so the backfill UPDATE would set NULL → NULL anyway, which
														
 
															+    # is the desired no-op.
														
 
															+    assert dict(rows) == {1: 1.11, 2: None, 3: None, 4: None}