| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207 |
- from collections import defaultdict
- from datetime import date, datetime, time, timedelta, timezone
- from sqlalchemy import and_, func, select
- from sqlalchemy.ext.asyncio import AsyncSession
- from backend.app.models.archive import PrintArchive
- from backend.app.models.printer import Printer
class FailureAnalysisService:
    """Service for analyzing print failure patterns."""

    # Archive statuses that are counted as failures throughout the analysis.
    _FAILED_STATUSES = ("failed", "aborted")

    def __init__(self, db: AsyncSession):
        """Keep the async session that every query in this service runs on."""
        self.db = db

    @staticmethod
    def _resolve_period(
        days: int | None,
        date_from: date | None,
        date_to: date | None,
        now: datetime,
    ) -> tuple[datetime | None, datetime | None, datetime, int]:
        """Translate the caller's period arguments into concrete UTC bounds.

        Args:
            days: Look-back window in days, used only when no date is given
                (defaults to 30 when None).
            date_from: Inclusive start date, or None for an open start.
            date_to: Inclusive end date, or None for an open end.
            now: The "current" instant; passed in so one call uses one clock
                reading everywhere.

        Returns:
            A ``(lower, upper, period_end, effective_days)`` tuple where
            ``lower``/``upper`` are the inclusive ``created_at`` bounds (None
            when that side is open), ``period_end`` is the exclusive end of
            the analysed period (used to anchor the weekly trend) and
            ``effective_days`` is the length of the period in days (>= 1 for
            date ranges).
        """
        if date_from is None and date_to is None:
            effective_days = days if days is not None else 30
            return now - timedelta(days=effective_days), None, now, effective_days

        lower = upper = None
        # An open start is treated as "one year back" for span purposes only;
        # it does not add a lower bound to the query.
        range_start = now - timedelta(days=365)
        period_end = now
        if date_from is not None:
            lower = range_start = datetime.combine(date_from, time.min, tzinfo=timezone.utc)
        if date_to is not None:
            upper = datetime.combine(date_to, time.max, tzinfo=timezone.utc)
            try:
                # date_to is inclusive, so the period ends at the first instant
                # of the following day. Measuring up to 23:59:59.999999 instead
                # would under-count the span by one day.
                period_end = upper + timedelta(microseconds=1)
            except OverflowError:
                # date_to is date.max: there is no "next day" to represent.
                period_end = upper
        effective_days = max((period_end - range_start).days, 1)
        return lower, upper, period_end, effective_days

    @staticmethod
    def _trend_windows(period_end: datetime, num_weeks: int) -> list[tuple[datetime, datetime]]:
        """Return ``num_weeks`` consecutive one-week windows ending at ``period_end``.

        Windows are half-open ``[start, end)`` pairs, newest first. Fewer
        windows are returned if stepping back would leave the range of
        representable datetimes.
        """
        one_week = timedelta(weeks=1)
        windows = []
        week_end = period_end
        for _ in range(num_weeks):
            try:
                week_start = week_end - one_week
            except OverflowError:
                break
            windows.append((week_start, week_end))
            week_end = week_start
        return windows

    @staticmethod
    def _merge_counts(pairs) -> dict:
        """Sum counts per label and return them ordered by count, highest first.

        Several database groups can map to the same label (for example NULL
        and "" both become "Unknown"); summing keeps all of their counts
        instead of letting the last group overwrite the others. The sort is
        stable, so labels with equal counts keep their incoming order.
        """
        totals = defaultdict(int)
        for label, count in pairs:
            totals[label] += count
        return dict(sorted(totals.items(), key=lambda item: item[1], reverse=True))

    async def _count(self, conditions) -> int:
        """Count archives matching all ``conditions`` (0 when the query yields nothing)."""
        result = await self.db.execute(select(func.count(PrintArchive.id)).where(and_(*conditions)))
        return result.scalar() or 0

    async def analyze_failures(
        self,
        days: int | None = None,
        date_from: date | None = None,
        date_to: date | None = None,
        printer_id: int | None = None,
        project_id: int | None = None,
    ) -> dict:
        """Analyze failure patterns across archives.

        Args:
            days: Number of days to analyze (fallback when no date range)
            date_from: Start date filter (inclusive)
            date_to: End date filter (inclusive)
            printer_id: Optional filter by printer
            project_id: Optional filter by project

        Returns:
            Dictionary with failure analysis results: ``period_days``,
            ``total_prints``, ``failed_prints``, ``failure_rate`` (percent,
            one decimal), ``failures_by_reason``, ``failures_by_filament``,
            ``failures_by_printer``, ``failures_by_hour`` (all 24 hours
            present), ``recent_failures`` (up to 10, newest first) and
            ``trend`` (weekly buckets, oldest first, ending at the end of the
            analysed period).
        """
        # One clock reading per call keeps every window consistent.
        now = datetime.now(timezone.utc)
        lower, upper, period_end, effective_days = self._resolve_period(days, date_from, date_to, now)

        # Non-date filters are kept separately because the weekly trend reuses
        # them with its own date windows. Falsy ids (None, 0) disable a filter.
        non_date_filter = []
        if printer_id:
            non_date_filter.append(PrintArchive.printer_id == printer_id)
        if project_id:
            non_date_filter.append(PrintArchive.project_id == project_id)

        base_filter = []
        if lower is not None:
            base_filter.append(PrintArchive.created_at >= lower)
        if upper is not None:
            base_filter.append(PrintArchive.created_at <= upper)
        base_filter.extend(non_date_filter)

        is_failure = PrintArchive.status.in_(self._FAILED_STATUSES)
        failed_filter = [*base_filter, is_failure]

        # Total counts
        total_prints = await self._count(base_filter)
        failed_prints = await self._count(failed_filter)
        failure_rate = (failed_prints / total_prints * 100) if total_prints > 0 else 0

        # Failures by reason
        reason_result = await self.db.execute(
            select(
                PrintArchive.failure_reason,
                func.count(PrintArchive.id).label("count"),
            )
            .where(and_(*failed_filter))
            .group_by(PrintArchive.failure_reason)
            .order_by(func.count(PrintArchive.id).desc())
        )
        failures_by_reason = self._merge_counts(
            (reason or "Unknown", count) for reason, count in reason_result.fetchall()
        )

        # Failures by filament type
        filament_result = await self.db.execute(
            select(
                PrintArchive.filament_type,
                func.count(PrintArchive.id).label("count"),
            )
            .where(and_(*failed_filter))
            .group_by(PrintArchive.filament_type)
            .order_by(func.count(PrintArchive.id).desc())
        )
        failures_by_filament = self._merge_counts(
            (filament or "Unknown", count) for filament, count in filament_result.fetchall()
        )

        # Failures by printer
        printer_result = await self.db.execute(
            select(
                PrintArchive.printer_id,
                func.count(PrintArchive.id).label("count"),
            )
            .where(and_(*failed_filter, PrintArchive.printer_id.isnot(None)))
            .group_by(PrintArchive.printer_id)
            .order_by(func.count(PrintArchive.id).desc())
        )
        failures_by_printer_id = {pid: count for pid, count in printer_result.fetchall()}

        # Get printer names
        if failures_by_printer_id:
            printers_result = await self.db.execute(
                select(Printer.id, Printer.name).where(Printer.id.in_(list(failures_by_printer_id)))
            )
            printer_names = {pid: name for pid, name in printers_result.fetchall()}
            # Printers that share a display name have their counts combined
            # rather than one silently replacing the other.
            failures_by_printer = self._merge_counts(
                (printer_names.get(pid, f"Printer {pid}"), count)
                for pid, count in failures_by_printer_id.items()
            )
        else:
            failures_by_printer = {}

        # Failures by hour of day
        # NOTE(review): the hour is taken from started_at as returned by the
        # database; confirm which timezone that column is stored in.
        failed_archives_result = await self.db.execute(
            select(PrintArchive.started_at).where(and_(*failed_filter, PrintArchive.started_at.isnot(None)))
        )
        failures_by_hour = defaultdict(int)
        for (started_at,) in failed_archives_result.fetchall():
            if started_at:
                failures_by_hour[started_at.hour] += 1
        # Convert to dict with all 24 hours
        failures_by_hour_complete = {h: failures_by_hour.get(h, 0) for h in range(24)}

        # Recent failures
        recent_result = await self.db.execute(
            select(PrintArchive).where(and_(*failed_filter)).order_by(PrintArchive.created_at.desc()).limit(10)
        )
        recent_failures = [
            {
                "id": a.id,
                "print_name": a.print_name or a.filename,
                "failure_reason": a.failure_reason,
                "filament_type": a.filament_type,
                "printer_id": a.printer_id,
                "created_at": a.created_at.isoformat() if a.created_at else None,
            }
            for a in recent_result.scalars().all()
        ]

        # Failure rate trend (by week). Windows are anchored to the end of the
        # analysed period, so a historical date range yields a trend for that
        # range rather than for the weeks leading up to today.
        trend_data = []
        num_weeks = max(effective_days // 7, 1)
        for week_start, week_end in self._trend_windows(period_end, num_weeks):
            week_filter = [
                PrintArchive.created_at >= week_start,
                PrintArchive.created_at < week_end,
                *non_date_filter,
            ]
            total = await self._count(week_filter)
            failed = await self._count([*week_filter, is_failure])
            rate = (failed / total * 100) if total > 0 else 0
            trend_data.append(
                {
                    "week_start": week_start.date().isoformat(),
                    "total_prints": total,
                    "failed_prints": failed,
                    "failure_rate": round(rate, 1),
                }
            )
        trend_data.reverse()  # Oldest first

        return {
            "period_days": effective_days,
            "total_prints": total_prints,
            "failed_prints": failed_prints,
            "failure_rate": round(failure_rate, 1),
            "failures_by_reason": failures_by_reason,
            "failures_by_filament": failures_by_filament,
            "failures_by_printer": failures_by_printer,
            "failures_by_hour": failures_by_hour_complete,
            "recent_failures": recent_failures,
            "trend": trend_data,
        }
|