archive.py 38 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943
  1. import hashlib
  2. import json
  3. import re
  4. import shutil
  5. import zipfile
  6. from datetime import datetime
  7. from pathlib import Path
  8. from xml.etree import ElementTree as ET
  9. from sqlalchemy import and_, or_, select
  10. from sqlalchemy.ext.asyncio import AsyncSession
  11. from backend.app.core.config import settings
  12. from backend.app.models.archive import PrintArchive
  13. from backend.app.models.filament import Filament
  14. from backend.app.models.printer import Printer
  15. class ThreeMFParser:
  16. """Parser for Bambu Lab 3MF files."""
  17. def __init__(self, file_path: Path, plate_number: int | None = None):
  18. self.file_path = file_path
  19. self.plate_number = plate_number # Which plate was printed (1, 2, 3, etc.)
  20. self.metadata: dict = {}
  21. def parse(self) -> dict:
  22. """Extract metadata from 3MF file."""
  23. try:
  24. with zipfile.ZipFile(self.file_path, "r") as zf:
  25. self._parse_slice_info(zf)
  26. self._parse_project_settings(zf)
  27. self._parse_gcode_header(zf)
  28. self._parse_3dmodel(zf)
  29. self._extract_thumbnail(zf)
  30. # ALWAYS prefer slice_info values - they contain ONLY filaments actually used in print
  31. # project_settings contains ALL configured filaments (AMS slots), not just used ones
  32. if self.metadata.get("_slice_filament_type"):
  33. self.metadata["filament_type"] = self.metadata["_slice_filament_type"]
  34. if self.metadata.get("_slice_filament_color"):
  35. self.metadata["filament_color"] = self.metadata["_slice_filament_color"]
  36. # Clean up internal keys
  37. self.metadata.pop("_slice_filament_type", None)
  38. self.metadata.pop("_slice_filament_color", None)
  39. except Exception:
  40. pass
  41. return self.metadata
  42. def _parse_slice_info(self, zf: zipfile.ZipFile):
  43. """Parse slice_info.config for print settings and printable objects."""
  44. try:
  45. if "Metadata/slice_info.config" in zf.namelist():
  46. content = zf.read("Metadata/slice_info.config").decode()
  47. root = ET.fromstring(content)
  48. # Get the correct plate's metadata (use plate_number if specified)
  49. if self.plate_number:
  50. plate = root.find(f".//plate[@plate_idx='{self.plate_number}']")
  51. if plate is None:
  52. # Fallback to first plate if specific plate not found
  53. plate = root.find(".//plate")
  54. else:
  55. plate = root.find(".//plate")
  56. if plate is not None:
  57. # Get prediction and weight from metadata elements
  58. for meta in plate.findall("metadata"):
  59. key = meta.get("key")
  60. value = meta.get("value")
  61. if key == "prediction" and value:
  62. self.metadata["print_time_seconds"] = int(value)
  63. elif key == "weight" and value:
  64. self.metadata["filament_used_grams"] = float(value)
  65. # Extract printable objects for skip object functionality
  66. # Objects are stored as <object identify_id="123" name="Part1" skipped="false" />
  67. printable_objects = {}
  68. for obj in plate.findall("object"):
  69. identify_id = obj.get("identify_id")
  70. name = obj.get("name")
  71. skipped = obj.get("skipped", "false")
  72. # Only include objects that are not pre-skipped
  73. if identify_id and name and skipped.lower() != "true":
  74. try:
  75. printable_objects[int(identify_id)] = name
  76. except ValueError:
  77. pass
  78. if printable_objects:
  79. self.metadata["printable_objects"] = printable_objects
  80. # Get filament info from filaments ACTUALLY USED in the print
  81. # slice_info has <filament id="1" type="PLA" color="#FFFFFF" used_g="100" />
  82. # Only include filaments where used_g > 0
  83. filaments = root.findall(".//filament")
  84. if filaments:
  85. # Collect unique filament types and colors for filaments that are actually used
  86. types = []
  87. colors = []
  88. for f in filaments:
  89. # Check if this filament is actually used in the print
  90. used_g = f.get("used_g", "0")
  91. try:
  92. used_amount = float(used_g)
  93. except (ValueError, TypeError):
  94. used_amount = 0
  95. # Only include if used_g > 0 (filament is actually consumed)
  96. if used_amount > 0:
  97. ftype = f.get("type")
  98. fcolor = f.get("color")
  99. if ftype and ftype not in types:
  100. types.append(ftype)
  101. if fcolor and fcolor not in colors:
  102. colors.append(fcolor)
  103. if types:
  104. self.metadata["_slice_filament_type"] = ", ".join(types)
  105. if colors:
  106. self.metadata["_slice_filament_color"] = ",".join(colors)
  107. except Exception:
  108. pass
  109. def _parse_project_settings(self, zf: zipfile.ZipFile):
  110. """Parse project settings for print configuration."""
  111. try:
  112. if "Metadata/project_settings.config" in zf.namelist():
  113. content = zf.read("Metadata/project_settings.config").decode()
  114. try:
  115. data = json.loads(content)
  116. self._extract_filament_info(data)
  117. self._extract_print_settings(data)
  118. except json.JSONDecodeError:
  119. pass
  120. except Exception:
  121. pass
  122. def _parse_gcode_header(self, zf: zipfile.ZipFile):
  123. """Parse G-code file header for total layer count."""
  124. import re
  125. try:
  126. # Look for plate_1.gcode or similar
  127. gcode_files = [f for f in zf.namelist() if f.endswith(".gcode")]
  128. if not gcode_files:
  129. return
  130. # Read first 2KB of G-code (header contains the layer count)
  131. gcode_path = gcode_files[0]
  132. with zf.open(gcode_path) as f:
  133. header = f.read(2048).decode("utf-8", errors="ignore")
  134. # Look for "; total layer number: XX" pattern
  135. match = re.search(r";\s*total\s+layer\s+number[:\s]+(\d+)", header, re.IGNORECASE)
  136. if match:
  137. self.metadata["total_layers"] = int(match.group(1))
  138. except Exception:
  139. pass
  140. def _extract_filament_info(self, data: dict):
  141. """Extract filament info, preferring non-support filaments."""
  142. try:
  143. filament_types = data.get("filament_type", [])
  144. filament_colors = data.get("filament_colour", [])
  145. filament_is_support = data.get("filament_is_support", [])
  146. if not filament_types:
  147. return
  148. # Collect all non-support filaments
  149. non_support_types = []
  150. non_support_colors = []
  151. for i, ftype in enumerate(filament_types):
  152. is_support = filament_is_support[i] if i < len(filament_is_support) else "0"
  153. if is_support == "0":
  154. if ftype and ftype not in non_support_types:
  155. non_support_types.append(ftype)
  156. if i < len(filament_colors) and filament_colors[i]:
  157. color = filament_colors[i]
  158. if color not in non_support_colors:
  159. non_support_colors.append(color)
  160. # Fallback to first filament if all are support
  161. if not non_support_types and filament_types:
  162. non_support_types = [filament_types[0]]
  163. if not non_support_colors and filament_colors:
  164. non_support_colors = [filament_colors[0]]
  165. # Store filament type(s)
  166. if non_support_types:
  167. self.metadata["filament_type"] = ", ".join(non_support_types)
  168. # Store all colors as comma-separated (for multi-color display)
  169. if non_support_colors:
  170. self.metadata["filament_color"] = ",".join(non_support_colors)
  171. except Exception:
  172. pass
  173. def _extract_print_settings(self, data: dict):
  174. """Extract print settings from JSON config."""
  175. try:
  176. # Layer height - usually an array, get first value
  177. if "layer_height" in data:
  178. val = data["layer_height"]
  179. if isinstance(val, list) and val:
  180. self.metadata["layer_height"] = float(val[0])
  181. elif isinstance(val, (int, float, str)):
  182. self.metadata["layer_height"] = float(val)
  183. # Nozzle diameter
  184. if "nozzle_diameter" in data:
  185. val = data["nozzle_diameter"]
  186. if isinstance(val, list) and val:
  187. self.metadata["nozzle_diameter"] = float(val[0])
  188. elif isinstance(val, (int, float, str)):
  189. self.metadata["nozzle_diameter"] = float(val)
  190. # Bed temperature - first layer or regular
  191. for key in ["bed_temperature_initial_layer", "bed_temperature"]:
  192. if key in data:
  193. val = data[key]
  194. if isinstance(val, list) and val:
  195. self.metadata["bed_temperature"] = int(float(val[0]))
  196. elif isinstance(val, (int, float, str)):
  197. self.metadata["bed_temperature"] = int(float(val))
  198. break
  199. # Nozzle temperature
  200. for key in ["nozzle_temperature_initial_layer", "nozzle_temperature"]:
  201. if key in data:
  202. val = data[key]
  203. if isinstance(val, list) and val:
  204. self.metadata["nozzle_temperature"] = int(float(val[0]))
  205. elif isinstance(val, (int, float, str)):
  206. self.metadata["nozzle_temperature"] = int(float(val))
  207. break
  208. except Exception:
  209. pass
  210. def _extract_settings_from_content(self, content: str):
  211. """Extract print settings from config content."""
  212. settings_map = {
  213. "layer_height": ("layer_height", float),
  214. "nozzle_diameter": ("nozzle_diameter", float),
  215. "bed_temperature": ("bed_temperature", int),
  216. "nozzle_temperature": ("nozzle_temperature", int),
  217. }
  218. for key, (search_key, converter) in settings_map.items():
  219. if key not in self.metadata:
  220. try:
  221. # Try JSON format
  222. if f'"{search_key}"' in content:
  223. start = content.find(f'"{search_key}"')
  224. value_start = content.find(":", start) + 1
  225. value_end = content.find(",", value_start)
  226. if value_end == -1:
  227. value_end = content.find("}", value_start)
  228. value = content[value_start:value_end].strip().strip('"')
  229. self.metadata[key] = converter(value)
  230. except Exception:
  231. pass
  232. def _parse_3dmodel(self, zf: zipfile.ZipFile):
  233. """Parse 3D/3dmodel.model for MakerWorld metadata."""
  234. import re
  235. try:
  236. model_path = "3D/3dmodel.model"
  237. if model_path not in zf.namelist():
  238. return
  239. content = zf.read(model_path).decode("utf-8", errors="ignore")
  240. # Parse XML metadata elements
  241. # MakerWorld adds metadata like: <metadata name="Designer">username</metadata>
  242. metadata_pattern = r'<metadata\s+name="([^"]+)"[^>]*>([^<]*)</metadata>'
  243. matches = re.findall(metadata_pattern, content)
  244. makerworld_fields = {}
  245. for name, value in matches:
  246. makerworld_fields[name] = value.strip()
  247. # Check for direct MakerWorld URL in content
  248. url_pattern = r'https?://makerworld\.com/[^\s<>"\']+/models/(\d+)'
  249. url_match = re.search(url_pattern, content)
  250. if url_match:
  251. self.metadata["makerworld_url"] = url_match.group(0)
  252. self.metadata["makerworld_model_id"] = url_match.group(1)
  253. # Extract model ID from DSM reference in image URLs
  254. # Format: https://makerworld.bblmw.com/makerworld/model/DSM00000001275614/...
  255. # The numeric part (1275614) is the MakerWorld model ID
  256. if "makerworld_url" not in self.metadata:
  257. dsm_pattern = r"DSM0+(\d+)"
  258. dsm_match = re.search(dsm_pattern, content)
  259. if dsm_match:
  260. model_id = dsm_match.group(1)
  261. self.metadata["makerworld_url"] = f"https://makerworld.com/en/models/{model_id}"
  262. self.metadata["makerworld_model_id"] = model_id
  263. # Store designer info
  264. if "Designer" in makerworld_fields:
  265. self.metadata["designer"] = makerworld_fields["Designer"]
  266. if "Title" in makerworld_fields:
  267. self.metadata["print_name"] = makerworld_fields["Title"]
  268. except Exception:
  269. pass
  270. def _extract_thumbnail(self, zf: zipfile.ZipFile):
  271. """Extract thumbnail image from 3MF.
  272. If a plate_number was specified, try to use that plate's thumbnail first.
  273. """
  274. thumbnail_paths = []
  275. # If a specific plate was printed, try that thumbnail first
  276. if self.plate_number:
  277. thumbnail_paths.append(f"Metadata/plate_{self.plate_number}.png")
  278. # Fallback to default paths
  279. thumbnail_paths.extend(
  280. [
  281. "Metadata/plate_1.png",
  282. "Metadata/thumbnail.png",
  283. "Metadata/model_thumbnail.png",
  284. ]
  285. )
  286. for thumb_path in thumbnail_paths:
  287. if thumb_path in zf.namelist():
  288. self.metadata["_thumbnail_data"] = zf.read(thumb_path)
  289. self.metadata["_thumbnail_ext"] = ".png"
  290. break
  291. def extract_printable_objects_from_3mf(
  292. data: bytes, plate_number: int | None = None, include_positions: bool = False
  293. ) -> dict[int, str] | dict[int, dict]:
  294. """Extract printable objects from 3MF file bytes.
  295. This is a lightweight function used during print start to get the list
  296. of objects that can be skipped.
  297. Args:
  298. data: Raw bytes of the 3MF file
  299. plate_number: Which plate was printed (1-based), or None for first plate
  300. include_positions: If True, return dict with name and position info
  301. Returns:
  302. If include_positions=False: Dictionary mapping identify_id (int) to object name (str)
  303. If include_positions=True: Dictionary mapping identify_id to {name, x, y} dict
  304. """
  305. import json
  306. from io import BytesIO
  307. printable_objects: dict = {}
  308. try:
  309. with zipfile.ZipFile(BytesIO(data), "r") as zf:
  310. if "Metadata/slice_info.config" not in zf.namelist():
  311. return printable_objects
  312. content = zf.read("Metadata/slice_info.config").decode()
  313. root = ET.fromstring(content)
  314. # Find the correct plate
  315. plate_idx = plate_number or 1
  316. if plate_number:
  317. plate = root.find(f".//plate[@plate_idx='{plate_number}']")
  318. if plate is None:
  319. plate = root.find(".//plate")
  320. else:
  321. plate = root.find(".//plate")
  322. if plate is None:
  323. return printable_objects
  324. # Load position data from plate_N.json if we need positions
  325. bbox_objects = []
  326. if include_positions:
  327. plate_json_path = f"Metadata/plate_{plate_idx}.json"
  328. if plate_json_path in zf.namelist():
  329. try:
  330. plate_json = json.loads(zf.read(plate_json_path).decode())
  331. bbox_objects = plate_json.get("bbox_objects", [])
  332. except (json.JSONDecodeError, KeyError):
  333. pass
  334. # Extract objects from slice_info.config
  335. objects_list = []
  336. for obj in plate.findall("object"):
  337. identify_id = obj.get("identify_id")
  338. name = obj.get("name")
  339. skipped = obj.get("skipped", "false")
  340. if identify_id and name and skipped.lower() != "true":
  341. try:
  342. obj_id = int(identify_id)
  343. objects_list.append((obj_id, name))
  344. except ValueError:
  345. pass
  346. # Match objects with positions by index (both lists are in same order)
  347. for idx, (obj_id, name) in enumerate(objects_list):
  348. if include_positions:
  349. x, y = None, None
  350. if idx < len(bbox_objects):
  351. bbox = bbox_objects[idx].get("bbox", [])
  352. if len(bbox) >= 4:
  353. # Calculate center from bbox [x_min, y_min, x_max, y_max]
  354. x = (bbox[0] + bbox[2]) / 2
  355. y = (bbox[1] + bbox[3]) / 2
  356. printable_objects[obj_id] = {"name": name, "x": x, "y": y}
  357. else:
  358. printable_objects[obj_id] = name
  359. except Exception:
  360. pass
  361. return printable_objects
  362. class ProjectPageParser:
  363. """Parser for extracting project page data from Bambu Lab 3MF files."""
  364. def __init__(self, file_path: Path):
  365. self.file_path = file_path
  366. def parse(self, archive_id: int) -> dict:
  367. """Extract project page metadata and images from 3MF file."""
  368. import html
  369. import re
  370. result = {
  371. "title": None,
  372. "description": None,
  373. "designer": None,
  374. "designer_user_id": None,
  375. "license": None,
  376. "copyright": None,
  377. "creation_date": None,
  378. "modification_date": None,
  379. "origin": None,
  380. "profile_title": None,
  381. "profile_description": None,
  382. "profile_cover": None,
  383. "profile_user_id": None,
  384. "profile_user_name": None,
  385. "design_model_id": None,
  386. "design_profile_id": None,
  387. "design_region": None,
  388. "model_pictures": [],
  389. "profile_pictures": [],
  390. "thumbnails": [],
  391. }
  392. try:
  393. with zipfile.ZipFile(self.file_path, "r") as zf:
  394. # Parse 3D/3dmodel.model for metadata
  395. model_path = "3D/3dmodel.model"
  396. if model_path in zf.namelist():
  397. content = zf.read(model_path).decode("utf-8", errors="ignore")
  398. # Extract metadata elements using regex
  399. # Format: <metadata name="Key">Value</metadata> or <metadata name="Key" />
  400. metadata_pattern = r'<metadata\s+name="([^"]+)"[^>]*>([^<]*)</metadata>'
  401. matches = re.findall(metadata_pattern, content)
  402. field_mapping = {
  403. "Title": "title",
  404. "Description": "description",
  405. "Designer": "designer",
  406. "DesignerUserId": "designer_user_id",
  407. "License": "license",
  408. "Copyright": "copyright",
  409. "CreationDate": "creation_date",
  410. "ModificationDate": "modification_date",
  411. "Origin": "origin",
  412. "ProfileTitle": "profile_title",
  413. "ProfileDescription": "profile_description",
  414. "ProfileCover": "profile_cover",
  415. "ProfileUserId": "profile_user_id",
  416. "ProfileUserName": "profile_user_name",
  417. "DesignModelId": "design_model_id",
  418. "DesignProfileId": "design_profile_id",
  419. "DesignRegion": "design_region",
  420. }
  421. for name, value in matches:
  422. if name in field_mapping:
  423. # Decode HTML entities multiple times (content is often triple-encoded)
  424. decoded = value.strip()
  425. prev = None
  426. while prev != decoded:
  427. prev = decoded
  428. decoded = html.unescape(decoded)
  429. # Normalize non-breaking spaces to regular spaces
  430. decoded = decoded.replace("\xa0", " ")
  431. result[field_mapping[name]] = decoded if decoded else None
  432. # List images in Auxiliaries folder
  433. from urllib.parse import quote
  434. for name in zf.namelist():
  435. if name.startswith("Auxiliaries/Model Pictures/"):
  436. filename = name.split("/")[-1]
  437. if filename:
  438. result["model_pictures"].append(
  439. {
  440. "name": filename,
  441. "path": name,
  442. "url": f"/api/v1/archives/{archive_id}/project-image/{quote(name, safe='')}",
  443. }
  444. )
  445. elif name.startswith("Auxiliaries/Profile Pictures/"):
  446. filename = name.split("/")[-1]
  447. if filename:
  448. result["profile_pictures"].append(
  449. {
  450. "name": filename,
  451. "path": name,
  452. "url": f"/api/v1/archives/{archive_id}/project-image/{quote(name, safe='')}",
  453. }
  454. )
  455. elif name.startswith("Auxiliaries/.thumbnails/"):
  456. filename = name.split("/")[-1]
  457. if filename:
  458. result["thumbnails"].append(
  459. {
  460. "name": filename,
  461. "path": name,
  462. "url": f"/api/v1/archives/{archive_id}/project-image/{quote(name, safe='')}",
  463. }
  464. )
  465. except Exception as e:
  466. result["_error"] = str(e)
  467. return result
  468. def get_image(self, image_path: str) -> tuple[bytes, str] | None:
  469. """Extract an image from the 3MF file.
  470. Returns tuple of (image_data, content_type) or None if not found.
  471. """
  472. try:
  473. with zipfile.ZipFile(self.file_path, "r") as zf:
  474. if image_path in zf.namelist():
  475. data = zf.read(image_path)
  476. # Determine content type from extension
  477. ext = image_path.lower().split(".")[-1]
  478. content_types = {
  479. "png": "image/png",
  480. "jpg": "image/jpeg",
  481. "jpeg": "image/jpeg",
  482. "webp": "image/webp",
  483. "gif": "image/gif",
  484. }
  485. content_type = content_types.get(ext, "application/octet-stream")
  486. return (data, content_type)
  487. except Exception:
  488. pass
  489. return None
  490. def update_metadata(self, updates: dict) -> bool:
  491. """Update project page metadata in the 3MF file.
  492. Args:
  493. updates: Dict with fields to update (title, description, designer, etc.)
  494. Returns:
  495. True if successful, False otherwise.
  496. """
  497. import html
  498. import re
  499. import tempfile
  500. try:
  501. # Read the 3MF file
  502. with zipfile.ZipFile(self.file_path, "r") as zf_read:
  503. # Find and read the 3dmodel.model file
  504. model_path = "3D/3dmodel.model"
  505. if model_path not in zf_read.namelist():
  506. return False
  507. content = zf_read.read(model_path).decode("utf-8")
  508. # Update metadata fields
  509. field_mapping = {
  510. "title": "Title",
  511. "description": "Description",
  512. "designer": "Designer",
  513. "license": "License",
  514. "copyright": "Copyright",
  515. "profile_title": "ProfileTitle",
  516. "profile_description": "ProfileDescription",
  517. }
  518. for field, xml_name in field_mapping.items():
  519. if field in updates and updates[field] is not None:
  520. new_value = html.escape(updates[field])
  521. # Replace existing metadata or we'd need to add it
  522. pattern = rf'(<metadata\s+name="{xml_name}"[^>]*>)[^<]*(</metadata>)'
  523. replacement = rf"\g<1>{new_value}\g<2>"
  524. content = re.sub(pattern, replacement, content)
  525. # Write to a temporary file first
  526. with tempfile.NamedTemporaryFile(delete=False, suffix=".3mf") as tmp:
  527. tmp_path = Path(tmp.name)
  528. # Create new zip with updated content
  529. with zipfile.ZipFile(tmp_path, "w", zipfile.ZIP_DEFLATED) as zf_write:
  530. for item in zf_read.namelist():
  531. if item == model_path:
  532. zf_write.writestr(item, content.encode("utf-8"))
  533. else:
  534. zf_write.writestr(item, zf_read.read(item))
  535. # Replace original file with updated one
  536. shutil.move(tmp_path, self.file_path)
  537. return True
  538. except Exception:
  539. # Clean up temp file if it exists
  540. if "tmp_path" in locals() and tmp_path.exists():
  541. tmp_path.unlink()
  542. return False
  class ArchiveService:
      """Service for archiving print jobs."""

      def __init__(self, db: AsyncSession):
          self.db = db

      @staticmethod
      def compute_file_hash(file_path: Path) -> str:
          """Compute SHA256 hash of a file for duplicate detection."""
          sha256 = hashlib.sha256()
          with open(file_path, "rb") as f:
              # Read in chunks to handle large files
              for chunk in iter(lambda: f.read(8192), b""):
                  sha256.update(chunk)
          return sha256.hexdigest()

      async def get_duplicate_hashes(self) -> set[str]:
          """Get all content hashes that appear more than once.

          Returns a set of hashes that have duplicates.
          """
          from sqlalchemy import func

          result = await self.db.execute(
              select(PrintArchive.content_hash)
              .where(PrintArchive.content_hash.isnot(None))
              .group_by(PrintArchive.content_hash)
              .having(func.count(PrintArchive.id) > 1)
          )
          return {row[0] for row in result.all()}

      async def find_duplicates(
          self,
          archive_id: int,
          content_hash: str | None = None,
          print_name: str | None = None,
          makerworld_model_id: str | None = None,
      ) -> list[dict]:
          """Find duplicate archives based on hash or name matching.

          Exact (hash) matches come first, followed by "similar" matches that
          share the print name (case-insensitive) or the MakerWorld model ID.
          Each query returns at most 10 rows, newest first; the archive itself
          is never included.

          Returns list of dicts with id, print_name, created_at, match_type.
          """
          duplicates = []
          seen_ids = set()

          def record(archive, match_type):
              """Append an archive once, tagged with how it matched."""
              if archive.id in seen_ids:
                  return
              seen_ids.add(archive.id)
              duplicates.append(
                  {
                      "id": archive.id,
                      "print_name": archive.print_name,
                      "created_at": archive.created_at,
                      "match_type": match_type,
                  }
              )

          # First, find exact matches by content hash
          if content_hash:
              result = await self.db.execute(
                  select(PrintArchive)
                  .where(
                      and_(
                          PrintArchive.content_hash == content_hash,
                          PrintArchive.id != archive_id,
                      )
                  )
                  .order_by(PrintArchive.created_at.desc())
                  .limit(10)
              )
              for archive in result.scalars().all():
                  record(archive, "exact")

          # Then, find similar matches by print name or MakerWorld ID
          if print_name or makerworld_model_id:
              name_conditions = []
              if print_name:
                  # Case-insensitive equality. LIKE wildcards in the name are
                  # escaped so "part_1" does not also match "partX1".
                  escaped_name = (
                      print_name.replace("\\", "\\\\").replace("%", "\\%").replace("_", "\\_")
                  )
                  name_conditions.append(PrintArchive.print_name.ilike(escaped_name, escape="\\"))
              if makerworld_model_id:
                  # Match by MakerWorld model ID stored in extra_data
                  # Use json_extract for SQLite compatibility (astext is PostgreSQL-only)
                  from sqlalchemy import func

                  name_conditions.append(
                      func.json_extract(PrintArchive.extra_data, "$.makerworld_model_id") == str(makerworld_model_id)
                  )

              result = await self.db.execute(
                  select(PrintArchive)
                  .where(and_(PrintArchive.id != archive_id, or_(*name_conditions)))
                  .order_by(PrintArchive.created_at.desc())
                  .limit(10)
              )
              for archive in result.scalars().all():
                  # Archives already reported as exact matches are not repeated
                  record(archive, "similar")

          return duplicates

      async def archive_print(
          self,
          printer_id: int | None,
          source_file: Path,
          print_data: dict | None = None,
      ) -> PrintArchive | None:
          """Archive a 3MF file with metadata.

          Copies the file into ``<archive_dir>/<printer or "unassigned">/
          <timestamp>_<stem>/``, parses it, stores the thumbnail next to it and
          creates the database record.

          Args:
              printer_id: Printer the print belongs to, or None for none.
              source_file: 3MF file to archive.
              print_data: Optional print data (from MQTT); its ``filename`` is
                  searched for ``plate_<n>`` and its ``status`` sets the archive
                  status.

          Returns:
              The stored archive, or None if ``printer_id`` is given but no such
              printer exists.
          """
          import asyncio

          # Verify printer exists if specified
          if printer_id is not None:
              result = await self.db.execute(select(Printer).where(Printer.id == printer_id))
              if not result.scalar_one_or_none():
                  return None

          # Archive directory structure; "unassigned" holds printer-less archives
          timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
          archive_name = f"{timestamp}_{source_file.stem}"
          printer_folder = str(printer_id) if printer_id is not None else "unassigned"
          archive_dir = settings.archive_dir / printer_folder / archive_name
          dest_file = archive_dir / source_file.name

          # Extract plate number from filename (e.g., "plate_5" from "/data/Metadata/plate_5.gcode")
          plate_number = None
          if print_data:
              match = re.search(r"plate_(\d+)", print_data.get("filename") or "")
              if match:
                  plate_number = int(match.group(1))

          def ingest():
              """Copy, hash and parse the file; returns what the record needs."""
              archive_dir.mkdir(parents=True, exist_ok=True)
              shutil.copy2(source_file, dest_file)
              digest = self.compute_file_hash(dest_file)
              parsed = ThreeMFParser(dest_file, plate_number=plate_number).parse()

              # Save thumbnail if present; raw bytes must not reach extra_data
              saved_thumbnail = None
              thumb_data = parsed.pop("_thumbnail_data", None)
              thumb_ext = parsed.pop("_thumbnail_ext", None)
              if thumb_data is not None:
                  thumb_file = archive_dir / f"thumbnail{thumb_ext}"
                  thumb_file.write_bytes(thumb_data)
                  saved_thumbnail = str(thumb_file.relative_to(settings.base_dir))
              return digest, parsed, saved_thumbnail, dest_file.stat().st_size

          # File copy, hashing and zip parsing are blocking; run them in a worker
          # thread so the event loop stays responsive (as attach_timelapse does).
          content_hash, metadata, thumbnail_path, file_size = await asyncio.to_thread(ingest)

          # Merge with print data from MQTT
          if print_data:
              metadata["_print_data"] = print_data

          # Determine status and timestamps
          status = print_data.get("status", "completed") if print_data else "archived"
          started_at = datetime.now() if status == "printing" else None
          completed_at = datetime.now() if status in ("completed", "failed", "archived") else None

          # Calculate cost based on filament usage and type
          cost = None
          filament_grams = metadata.get("filament_used_grams")
          filament_type = metadata.get("filament_type")
          if filament_grams and filament_type:
              # For multi-material prints, use the first filament type for cost calculation
              primary_type = filament_type.split(",")[0].strip()
              filament_result = await self.db.execute(select(Filament).where(Filament.type == primary_type).limit(1))
              filament = filament_result.scalar_one_or_none()
              cost_per_kg = filament.cost_per_kg if filament else None
              if cost_per_kg is None:
                  # Default cost_per_kg if filament type not found (or it has no price)
                  cost_per_kg = 25.0
              cost = round((filament_grams / 1000) * cost_per_kg, 2)

          # Create archive record
          archive = PrintArchive(
              printer_id=printer_id,
              filename=source_file.name,
              file_path=str(dest_file.relative_to(settings.base_dir)),
              file_size=file_size,
              content_hash=content_hash,
              thumbnail_path=thumbnail_path,
              print_name=metadata.get("print_name") or source_file.stem,
              print_time_seconds=metadata.get("print_time_seconds"),
              filament_used_grams=metadata.get("filament_used_grams"),
              filament_type=metadata.get("filament_type"),
              filament_color=metadata.get("filament_color"),
              layer_height=metadata.get("layer_height"),
              total_layers=metadata.get("total_layers"),
              nozzle_diameter=metadata.get("nozzle_diameter"),
              bed_temperature=metadata.get("bed_temperature"),
              nozzle_temperature=metadata.get("nozzle_temperature"),
              makerworld_url=metadata.get("makerworld_url"),
              designer=metadata.get("designer"),
              status=status,
              started_at=started_at,
              completed_at=completed_at,
              cost=cost,
              extra_data=metadata,
          )
          self.db.add(archive)
          await self.db.commit()
          await self.db.refresh(archive)
          return archive

      async def get_archive(self, archive_id: int) -> PrintArchive | None:
          """Get an archive by ID."""
          result = await self.db.execute(select(PrintArchive).where(PrintArchive.id == archive_id))
          return result.scalar_one_or_none()

      async def update_archive_status(
          self,
          archive_id: int,
          status: str,
          completed_at: datetime | None = None,
          failure_reason: str | None = None,
      ) -> bool:
          """Update the status of an archive.

          ``completed_at`` and ``failure_reason`` are only written when given.
          Returns False if the archive does not exist.
          """
          archive = await self.get_archive(archive_id)
          if not archive:
              return False
          archive.status = status
          if completed_at:
              archive.completed_at = completed_at
          if failure_reason:
              archive.failure_reason = failure_reason
          await self.db.commit()
          return True

      async def list_archives(
          self,
          printer_id: int | None = None,
          project_id: int | None = None,
          limit: int = 50,
          offset: int = 0,
      ) -> list[PrintArchive]:
          """List archives, newest first, with optional filtering."""
          from sqlalchemy.orm import selectinload

          query = (
              select(PrintArchive).options(selectinload(PrintArchive.project)).order_by(PrintArchive.created_at.desc())
          )
          if printer_id:
              query = query.where(PrintArchive.printer_id == printer_id)
          if project_id:
              query = query.where(PrintArchive.project_id == project_id)
          query = query.limit(limit).offset(offset)
          result = await self.db.execute(query)
          return list(result.scalars().all())

      async def delete_archive(self, archive_id: int) -> bool:
          """Delete an archive and its files.

          The whole directory containing the archived file is removed (errors
          ignored), then the database record. Returns False if the archive does
          not exist.
          """
          archive = await self.get_archive(archive_id)
          if not archive:
              return False
          # Delete files
          file_path = settings.base_dir / archive.file_path
          if file_path.exists():
              shutil.rmtree(file_path.parent, ignore_errors=True)
          # Delete database record
          await self.db.delete(archive)
          await self.db.commit()
          return True

      async def attach_timelapse(
          self,
          archive_id: int,
          timelapse_data: bytes,
          filename: str = "timelapse.mp4",
      ) -> bool:
          """Attach a timelapse video to an archive.

          The video is written into the archive's directory. Only the final
          path component of ``filename`` is used, so the file cannot be placed
          outside that directory. Returns False if the archive does not exist.
          """
          import asyncio

          archive = await self.get_archive(archive_id)
          if not archive:
              return False

          # Get archive directory
          archive_dir = (settings.base_dir / archive.file_path).parent

          # Strip any directory components ("../x.mp4" -> "x.mp4")
          safe_name = Path(filename).name or "timelapse.mp4"
          timelapse_file = archive_dir / safe_name

          # Save timelapse - use thread pool to avoid blocking event loop
          # (timelapse files can be 100MB+, sync write blocks for seconds)
          await asyncio.to_thread(timelapse_file.write_bytes, timelapse_data)

          # Update archive record
          archive.timelapse_path = str(timelapse_file.relative_to(settings.base_dir))
          await self.db.commit()
          return True
  801. # Update archive record
  802. archive.timelapse_path = str(timelapse_file.relative_to(settings.base_dir))
  803. await self.db.commit()
  804. return True