raven 16 hodín pred
commit
c127ce9407
1 zmenil súbory, kde vykonal 658 pridanie a 0 odobranie
  1. 658 0
      official_script/nostradamus_importer.py

+ 658 - 0
official_script/nostradamus_importer.py

@@ -0,0 +1,658 @@
+#!/usr/bin/env python3
+"""Upload script for the Nostradamus session-based upload/import API.
+
+The local tool only:
+- scans existing .torrent files and/or local data folders
+- creates a new import session on Nostradamus
+- uploads raw import candidates to that session
+- prints the web URL where the uploader should review the items
+"""
+
+from __future__ import annotations
+
import argparse
import base64
import hashlib
import json
import re
import secrets
import sys
import time
import urllib.error
import urllib.parse
import urllib.request
from dataclasses import dataclass
from pathlib import Path
from typing import Any, Dict, Iterable, List, Optional, Sequence, Tuple
+
+TEXT_EXTS = {".nfo", ".txt"}
+DEFAULT_TIMEOUT = 30
+DEFAULT_STATE_FILE = ".nostradamus-import-state.json"
+
+
@dataclass(frozen=True)
class RawBencoded:
    """Marks bytes as already-bencoded; Bencode.encode emits them verbatim."""

    value: bytes  # pre-encoded bencode payload, passed through untouched
+
+
@dataclass
class ParsedTorrent:
    """In-memory view of one torrent: identity, file layout, and raw bytes."""

    name: str  # torrent display name (info["name"])
    info_hash: str  # hex SHA-1 of the bencoded info dictionary
    size: int  # total payload size in bytes (sum of all file sizes)
    files: Dict[str, int]  # relative file path -> size in bytes
    data: Dict[str, Any]  # decoded top-level torrent dictionary
    binary: bytes  # complete .torrent file contents
    info_raw: bytes  # exact bencoded bytes of the info dict (hashed for info_hash)
+
+
class Bencode:
    """Minimal bencode codec for .torrent files.

    decode_torrent() additionally preserves the raw byte span of the "info"
    value so callers can hash the exact original serialization — the info
    hash must not depend on a re-encoding round trip.
    """

    @staticmethod
    def decode_torrent(data: bytes) -> Tuple[Dict[str, Any], bytes]:
        """Decode a top-level bencoded dictionary.

        Returns (decoded dict, raw bytes of the "info" value). Raises
        ValueError when the payload is not a dict or lacks an "info" key.
        """
        if not data.startswith(b"d"):
            raise ValueError("torrent payload must be a bencoded dictionary")

        index = 1
        result: Dict[str, Any] = {}
        info_raw: Optional[bytes] = None

        while data[index:index + 1] != b"e":
            key_raw, index = Bencode._decode_bytes_at(data, index)
            value_start = index
            value, index = Bencode._decode_at(data, index)
            key = key_raw.decode("utf-8", errors="replace")

            # Remember the exact byte span of the info dict; its SHA-1 is the
            # torrent's info hash and must be computed over these bytes.
            if key_raw == b"info":
                info_raw = data[value_start:index]

            result[key] = value

        if info_raw is None:
            raise ValueError("torrent missing info dictionary")

        return result, info_raw

    @staticmethod
    def _decode_bytes_at(data: bytes, index: int) -> Tuple[bytes, int]:
        """Decode a length-prefixed byte string ("<len>:<bytes>") at *index*."""
        token = data[index:index + 1]
        if not token.isdigit():
            raise ValueError(f"invalid byte string token at {index}: {token!r}")

        colon = data.index(b":", index)
        length = int(data[index:colon])
        start = colon + 1
        end = start + length
        return data[start:end], end

    @staticmethod
    def _decode_at(data: bytes, index: int) -> Tuple[Any, int]:
        """Decode any bencode value at *index*; return (value, next index).

        Byte strings are decoded to str when they are valid UTF-8, otherwise
        kept as bytes (e.g. the binary "pieces" blob).
        """
        token = data[index:index + 1]
        # Integer: i<digits>e
        if token == b"i":
            end = data.index(b"e", index)
            return int(data[index + 1:end]), end + 1
        # List: l<items>e
        if token == b"l":
            index += 1
            items = []
            while data[index:index + 1] != b"e":
                item, index = Bencode._decode_at(data, index)
                items.append(item)
            return items, index + 1
        # Dictionary: d<key><value>...e
        if token == b"d":
            index += 1
            result = {}
            while data[index:index + 1] != b"e":
                key, index = Bencode._decode_at(data, index)
                value, index = Bencode._decode_at(data, index)
                if isinstance(key, bytes):
                    key = key.decode("utf-8", errors="replace")
                result[key] = value
            return result, index + 1
        # Byte string: <len>:<bytes>
        if token.isdigit():
            colon = data.index(b":", index)
            length = int(data[index:colon])
            start = colon + 1
            end = start + length
            raw = data[start:end]
            try:
                return raw.decode("utf-8"), end
            except UnicodeDecodeError:
                return raw, end
        raise ValueError(f"invalid bencode token at {index}: {token!r}")

    @staticmethod
    def encode(value: Any) -> bytes:
        """Bencode *value* (RawBencoded, bool, int, bytes, str, list, dict).

        Dict keys are emitted in sorted byte order (bencode canonical form);
        RawBencoded payloads pass through verbatim. Raises TypeError for any
        unsupported type.
        """
        if isinstance(value, RawBencoded):
            return value.value
        # bool is tested before int because bool is an int subclass.
        if isinstance(value, bool):
            value = int(value)
        if isinstance(value, int):
            return f"i{value}e".encode("ascii")
        if isinstance(value, bytes):
            return str(len(value)).encode("ascii") + b":" + value
        if isinstance(value, str):
            raw = value.encode("utf-8")
            return str(len(raw)).encode("ascii") + b":" + raw
        if isinstance(value, list):
            return b"l" + b"".join(Bencode.encode(item) for item in value) + b"e"
        if isinstance(value, dict):
            items = []
            # Sort keys bytewise; str keys are compared via their UTF-8 encoding.
            for key in sorted(value.keys(), key=lambda item: item if isinstance(item, bytes) else str(item).encode("utf-8")):
                encoded_key = key if isinstance(key, bytes) else str(key)
                items.append(Bencode.encode(encoded_key))
                items.append(Bencode.encode(value[key]))
            return b"d" + b"".join(items) + b"e"
        raise TypeError(f"unsupported bencode type: {type(value)!r}")
+
+
class ImportUploader:
    """Drives one import run end to end.

    Scans local .torrent files and data paths, creates an import session on
    the Nostradamus API, uploads each candidate item, and records progress in
    a local JSON state file so a run can be audited afterwards.
    """

    def __init__(self, args: argparse.Namespace):
        self.args = args
        # validate_base_url() aborts the process for malformed/insecure URLs.
        self.base_url = validate_base_url(args.base_url, args.allow_insecure_http)
        self.importer_token = args.importer_token
        self.timeout = args.timeout
        self.state_path = Path(args.state_file)
        self.state: Dict[str, Any] = {}

    def run(self) -> int:
        """Execute the full scan/create/upload flow.

        Returns 0 when every item uploaded successfully, 1 otherwise.
        """
        candidates = self.collect_items()
        if not candidates:
            fatal("No import candidates found. Provide --torrent-root, --torrent, --data-root, or --path.")

        mode = self.infer_mode(candidates)
        client_job_id = self.args.client_job_id or default_client_job_id()

        info(f"Creating import session ({mode})")
        session = self.create_session(client_job_id, mode)
        session_id = session["id"]
        session_url = f"{self.base_url}/imports/{session_id}"

        self.state = {
            "client_job_id": client_job_id,
            "session_id": session_id,
            "mode": mode,
            "items": [],
        }
        self.write_state()

        print_scan_summary(candidates, mode)

        uploaded = []
        failures = 0

        for index, candidate in enumerate(candidates, start=1):
            label = candidate["original_name"]
            info(f"[{index}/{len(candidates)}] Uploading {label}")
            try:
                response = self.create_item(session_id, candidate)
                item = response["item"]
                uploaded.append({
                    "client_item_id": candidate["client_item_id"],
                    "item_id": item["id"],
                    "info_hash": candidate.get("info_hash"),
                    "status": item["status"],
                    "name": candidate["original_name"],
                    "source_kind": candidate["source_kind"],
                })
            except RuntimeError as error:
                # request() wraps HTTP/network errors in RuntimeError; keep
                # going so one bad item does not abort the whole session.
                failures += 1
                warn(f"{label}: {error}")
                uploaded.append({
                    "client_item_id": candidate["client_item_id"],
                    "info_hash": candidate.get("info_hash"),
                    "status": "failed",
                    "name": candidate["original_name"],
                    "source_kind": candidate["source_kind"],
                    "error": str(error),
                })

            # Persist after every item so progress survives an interruption.
            self.state["items"] = uploaded
            self.write_state()

        print("")
        print("Import session created.")
        print(f"Session ID : {session_id}")
        print(f"Review URL : {session_url}")
        print(f"Uploaded   : {len(candidates) - failures}/{len(candidates)} item(s)")
        if failures:
            print(f"Failed     : {failures}")
        print(f"State file : {self.state_path}")
        print("")
        print("Next steps:")
        print("1. Open the review URL in Nostradamus")
        print("2. Review the imported items on the website")
        print("3. Finalize the items you want to send into pending moderation")
        print("4. After approval, download the prepared .torrent from the site")

        return 0 if failures == 0 else 1

    def create_session(self, client_job_id: str, mode: str) -> dict:
        """POST a new import session; return the session payload."""
        response = self.request("POST", "/api/import/sessions", {
            "client_job_id": client_job_id,
            "mode": mode,
        })
        return response["data"]

    def create_item(self, session_id: str, payload: dict) -> dict:
        """POST one candidate item into the session; return the API payload."""
        response = self.request("POST", f"/api/import/sessions/{session_id}/items", payload)
        return response["data"]

    def request(self, method: str, path: str, payload: Optional[dict] = None) -> dict:
        """Issue an authenticated JSON request against the API.

        Raises RuntimeError (carrying the server's error message when one is
        available) for HTTP errors and connection failures.
        """
        url = f"{self.base_url}{path}"
        body = None
        headers = {"x-importer-token": self.importer_token, "accept": "application/json"}

        if payload is not None:
            body = json.dumps(payload).encode("utf-8")
            headers["content-type"] = "application/json"

        request = urllib.request.Request(url, data=body, method=method, headers=headers)

        try:
            with urllib.request.urlopen(request, timeout=self.timeout) as response:
                raw = response.read().decode("utf-8")
                return json.loads(raw) if raw else {}
        except urllib.error.HTTPError as error:
            body_text = error.read().decode("utf-8", errors="replace")
            # Prefer the API's structured {"error": ...} message when present.
            try:
                parsed = json.loads(body_text)
                message = parsed.get("error", body_text)
            except json.JSONDecodeError:
                message = body_text
            raise RuntimeError(f"{method} {path} failed with {error.code}: {message}") from error
        except urllib.error.URLError as error:
            raise RuntimeError(f"{method} {path} failed: {error}") from error

    def collect_items(self) -> List[dict]:
        """Scan all configured inputs and build the upload candidate list.

        Torrents matching a local data folder become cross-seed items and
        claim that folder; unclaimed data paths become data-only items.
        Candidates sharing an info hash are deduplicated (last one wins).
        """
        torrent_paths = self.expand_torrent_paths()
        data_paths = self.expand_data_paths()
        data_matcher = self.build_data_path_matcher(data_paths)
        matched_data_paths = set()
        items: List[dict] = []

        for torrent_path in torrent_paths:
            parsed = self.parse_torrent_file(torrent_path)
            if parsed is None:
                continue

            matched_data_path = self.match_data_path(parsed.name, data_matcher)
            if matched_data_path is not None:
                matched_data_paths.add(matched_data_path)

            item = self.build_cross_seed_item(torrent_path, parsed, matched_data_path)
            if item:
                items.append(item)

        for data_path in data_paths:
            # Paths already claimed by a torrent above are not re-imported.
            if data_path in matched_data_paths:
                continue

            item = self.build_data_only_item(data_path)
            if item:
                items.append(item)

        # Deduplicate by info hash while preserving relative order.
        deduped: Dict[str, dict] = {}
        unnamed: List[dict] = []

        for item in items:
            info_hash = item.get("info_hash")
            if info_hash:
                deduped[info_hash] = item
            else:
                unnamed.append(item)

        return list(deduped.values()) + unnamed

    def expand_torrent_paths(self) -> List[Path]:
        """Resolve --torrent and --torrent-root into a sorted, unique file list."""
        paths: List[Path] = []

        for raw in self.args.torrent or []:
            path = Path(raw).expanduser()
            if path.is_file():
                paths.append(path)

        for raw in self.args.torrent_root or []:
            root = Path(raw).expanduser()
            if root.is_dir():
                paths.extend(sorted(root.rglob("*.torrent")))

        return sorted(set(paths))

    def expand_data_paths(self) -> List[Path]:
        """Resolve --path and --data-root into candidate data paths.

        --data-root contributes each direct, non-hidden child; .torrent files
        are excluded since those belong to the torrent inputs.
        """
        paths: List[Path] = []

        for raw in self.args.path or []:
            path = Path(raw).expanduser()
            if path.exists():
                paths.append(path)

        for raw in self.args.data_root or []:
            root = Path(raw).expanduser()
            if root.is_dir():
                for child in sorted(root.iterdir()):
                    if child.name.startswith("."):
                        continue
                    paths.append(child)

        return [path for path in sorted(set(paths)) if path.suffix.lower() != ".torrent"]

    def infer_mode(self, items: Sequence[dict]) -> str:
        """Session mode: "cross_seed", "data_only", or "mixed"."""
        kinds = {item["source_kind"] for item in items}
        if kinds == {"cross_seed"}:
            return "cross_seed"
        if kinds == {"data_only"}:
            return "data_only"
        return "mixed"

    def build_data_path_matcher(self, paths: Sequence[Path]) -> Dict[str, List[Path]]:
        """Index data paths by their match keys for torrent-name lookup."""
        matcher: Dict[str, List[Path]] = {}
        for path in paths:
            for key in data_match_keys(path.name):
                matcher.setdefault(key, []).append(path)
        return matcher

    def match_data_path(self, torrent_name: str, matcher: Dict[str, List[Path]]) -> Optional[Path]:
        """Find and consume the first existing data path matching a torrent name.

        Matched entries are popped from the matcher lists so each data path
        can be claimed by at most one torrent.
        """
        for key in data_match_keys(torrent_name):
            candidates = matcher.get(key) or []
            while candidates:
                candidate = candidates.pop(0)
                if candidate.exists():
                    return candidate
        return None

    def build_cross_seed_item(
        self,
        torrent_path: Path,
        parsed: ParsedTorrent,
        matched_data_path: Optional[Path],
    ) -> dict:
        """Build the upload payload for an existing .torrent (cross-seed)."""
        nfo_content = load_adjacent_nfo([matched_data_path, torrent_path])
        local_path_hint = str(matched_data_path or torrent_path.parent)

        return {
            "client_item_id": stable_client_item_id(parsed.info_hash),
            "source_kind": "cross_seed",
            "original_name": parsed.name,
            "local_path_hint": local_path_hint,
            "info_hash": parsed.info_hash,
            "size": parsed.size,
            "raw_torrent": base64.b64encode(parsed.binary).decode("ascii"),
            "raw_nfo": nfo_content,
            "file_list": [{"path": path, "size": size} for path, size in parsed.files.items()],
            "detected_facts": {
                "source_path": str(torrent_path),
                "matched_data_path": str(matched_data_path) if matched_data_path else None,
                "has_nfo": bool(nfo_content),
                "file_count": len(parsed.files),
            },
        }

    def build_data_only_item(self, data_path: Path) -> Optional[dict]:
        """Build the upload payload for a bare data path (hashes the data)."""
        info(f"Hashing data for {data_path.name}")
        torrent_binary, parsed = self.create_torrent_from_path(data_path)
        nfo_content = load_adjacent_nfo([data_path])

        return {
            "client_item_id": stable_client_item_id(parsed.info_hash),
            "source_kind": "data_only",
            "original_name": parsed.name,
            "local_path_hint": str(data_path),
            "info_hash": parsed.info_hash,
            "size": parsed.size,
            "raw_torrent": base64.b64encode(torrent_binary).decode("ascii"),
            "raw_nfo": nfo_content,
            "file_list": [{"path": path, "size": size} for path, size in parsed.files.items()],
            "detected_facts": {
                "source_path": str(data_path),
                "has_nfo": bool(nfo_content),
                "file_count": len(parsed.files),
            },
        }

    def parse_torrent_file(self, path: Path) -> Optional[ParsedTorrent]:
        """Parse one .torrent file; return None (with a warning) on any error."""
        try:
            binary = path.read_bytes()
            data, info_raw = Bencode.decode_torrent(binary)
            info_dict = data["info"]
            # The info hash is defined over the original bencoded info bytes.
            info_hash = hashlib.sha1(info_raw).hexdigest()
            files = torrent_files(info_dict)
            size = sum(files.values())
            return ParsedTorrent(
                name=str(info_dict["name"]),
                info_hash=info_hash,
                size=size,
                files=files,
                data=data,
                binary=binary,
                info_raw=info_raw,
            )
        except Exception as error:
            # Deliberately broad: one corrupt torrent must not stop the scan.
            warn(f"Failed to parse {path}: {error}")
            return None

    def create_torrent_from_path(self, path: Path) -> Tuple[bytes, ParsedTorrent]:
        """Create a brand-new private torrent for *path*; return (binary, parsed).

        Fix over the original version: the info dictionary (whose "pieces"
        string can be very large) was bencoded three times and torrent_files()
        computed twice. Each now happens exactly once; RawBencoded splices the
        pre-encoded info payload into the final torrent. encode() is
        deterministic, so the output bytes are unchanged.
        """
        info_dict = build_info_dict(path)
        info_raw = Bencode.encode(info_dict)
        torrent_data = {
            "created by": "Nostradamus",
            "creation date": int(time.time()),
            "comment": "Proudly generated for Nostradamus",
            "info": info_dict,
        }
        torrent_binary = Bencode.encode({**torrent_data, "info": RawBencoded(info_raw)})
        files = torrent_files(info_dict)
        parsed = ParsedTorrent(
            name=str(info_dict["name"]),
            info_hash=hashlib.sha1(info_raw).hexdigest(),
            size=sum(files.values()),
            files=files,
            data=torrent_data,
            binary=torrent_binary,
            info_raw=info_raw,
        )
        return torrent_binary, parsed

    def write_state(self) -> None:
        """Persist self.state as pretty JSON; warn instead of failing on OSError."""
        try:
            self.state_path.write_text(json.dumps(self.state, indent=2, sort_keys=True), encoding="utf-8")
        except OSError as error:
            warn(f"Could not write state file {self.state_path}: {error}")
+
+
def validate_base_url(url: str, allow_insecure_http: bool) -> str:
    """Validate *url* as an http(s) base URL and return it without a trailing slash.

    Exits via fatal() when the URL is malformed, or when it would use plain
    HTTP against a non-local host without explicit permission.
    """
    pieces = urllib.parse.urlparse(url)

    is_web_scheme = pieces.scheme in {"http", "https"}
    if not (is_web_scheme and pieces.netloc):
        fatal("--base-url must be a full URL like https://nostradamus.foo")

    local_hosts = {"127.0.0.1", "localhost"}
    if pieces.scheme == "http" and pieces.hostname not in local_hosts and not allow_insecure_http:
        fatal("Refusing insecure HTTP for a non-local host. Use HTTPS or pass --allow-insecure-http.")

    return pieces.geturl().rstrip("/")
+
+
def load_adjacent_nfo(candidates: Sequence[Optional[Path]]) -> Optional[str]:
    """Return the text of the first .nfo file found next to any candidate path.

    For each non-None candidate, the candidate itself (when it is a directory)
    or its parent directory (when it exists) is scanned in sorted order; the
    first readable *.nfo is returned, capped at 500k characters. Returns None
    when nothing is found.
    """
    visited = set()

    for candidate in candidates:
        if candidate is None:
            continue

        candidate = candidate.expanduser()
        search_roots = []
        if candidate.is_dir():
            search_roots.append(candidate)
        elif candidate.exists():
            search_roots.append(candidate.parent)

        for root in search_roots:
            if root in visited:
                continue
            visited.add(root)

            for entry in sorted(root.iterdir()):
                # Fix: the original also tested membership in TEXT_EXTS, which
                # was redundant — only the ".nfo" comparison can ever match.
                if entry.suffix.lower() == ".nfo":
                    try:
                        # Cap the payload so a pathological file cannot bloat the upload.
                        return entry.read_text(encoding="utf-8", errors="replace")[:500_000]
                    except OSError:
                        # Unreadable entry: keep scanning for another .nfo.
                        continue

    return None
+
+
def torrent_files(info_dict: dict) -> Dict[str, int]:
    """Map relative file paths to byte sizes for a torrent info dictionary."""
    # Single-file torrents store the size directly under "length"; multi-file
    # torrents carry a "files" list with per-entry path components.
    if "files" not in info_dict:
        return {str(info_dict["name"]): int(info_dict["length"])}

    mapping: Dict[str, int] = {}
    for entry in info_dict["files"]:
        joined = "/".join(str(part) for part in entry["path"])
        mapping[joined] = int(entry["length"])
    return mapping
+
+
def build_info_dict(path: Path) -> dict:
    """Assemble the bencode "info" dictionary for a file or directory tree."""
    piece_size = choose_piece_length(path)
    meta: Dict[str, Any] = {
        "name": path.name,
        "piece length": piece_size,
        "pieces": compute_pieces(path, piece_size),
        "private": 1,
        "source": "Nostradamus",
    }

    if path.is_file():
        # Single-file layout: only the total length is recorded.
        meta["length"] = path.stat().st_size
        return meta

    # Multi-file layout: one entry per contained file, sorted for determinism,
    # with path components relative to the root directory.
    meta["files"] = [
        {"length": member.stat().st_size, "path": list(member.relative_to(path).parts)}
        for member in sorted(item for item in path.rglob("*") if item.is_file())
    ]
    return meta
+
+
def choose_piece_length(path: Path) -> int:
    """Pick a torrent piece size (256 KiB – 2 MiB) from the total payload size."""
    kib = 1024
    # (exclusive upper bound in bytes, piece length) — first matching tier wins.
    tiers = (
        (1 * kib**3, 256 * kib),
        (4 * kib**3, 512 * kib),
        (16 * kib**3, 1024 * kib),
    )

    size = total_path_size(path)
    for upper_bound, piece_length in tiers:
        if size < upper_bound:
            return piece_length
    return 2 * 1024 * 1024
+
+
def compute_pieces(path: Path, piece_length: int) -> bytes:
    """Concatenated SHA-1 digests of each fixed-size piece of *path*'s data."""
    hashes: List[bytes] = []
    pending = bytearray()

    for chunk in iter_path_chunks(path):
        pending += chunk
        # Emit a digest for every complete piece accumulated so far.
        while len(pending) >= piece_length:
            hashes.append(hashlib.sha1(bytes(pending[:piece_length])).digest())
            del pending[:piece_length]

    # A trailing partial piece is hashed as-is.
    if pending:
        hashes.append(hashlib.sha1(bytes(pending)).digest())

    return b"".join(hashes)
+
+
def iter_path_chunks(path: Path, chunk_size: int = 1024 * 1024) -> Iterable[bytes]:
    """Yield the binary content of *path* (file or tree) in chunk_size pieces.

    Directory trees are walked in sorted order so the resulting byte stream is
    deterministic across runs.
    """
    if path.is_file():
        targets = [path]
    else:
        targets = sorted(entry for entry in path.rglob("*") if entry.is_file())

    for target in targets:
        with target.open("rb") as stream:
            # iter(callable, sentinel) stops on the first empty read.
            for chunk in iter(lambda: stream.read(chunk_size), b""):
                yield chunk
+
+
def total_path_size(path: Path) -> int:
    """Total byte size of a file, or of every file under a directory tree."""
    if not path.is_file():
        return sum(entry.stat().st_size for entry in path.rglob("*") if entry.is_file())
    return path.stat().st_size
+
+
def data_match_keys(name: str) -> List[str]:
    """Candidate lookup keys for matching a torrent name to a data path.

    Returns the name itself, its stem, and the normalized (lowercased,
    alphanumeric-only) variant of each — deduplicated with order preserved
    and empty strings dropped.
    """
    variants = [name, Path(name).stem]
    variants += [normalize_key(item) for item in variants]

    unique = dict.fromkeys(variants)
    return [key for key in unique if key]
+
+
# Compiled once at import time; normalize_key runs for every candidate
# name/path pair during data matching.
_NON_ALNUM_RE = re.compile(r"[^a-z0-9]+")


def normalize_key(value: str) -> str:
    """Lowercase *value* and drop every character outside [a-z0-9].

    Fix: the original did `import re` inside the function body, against the
    file's top-level-import convention, paying module and pattern-cache
    lookups on every call; the pattern is now precompiled at module scope.
    """
    return _NON_ALNUM_RE.sub("", value.lower())
+
+
def stable_client_item_id(info_hash: str) -> str:
    """Deterministic per-item id derived from the torrent's info hash prefix."""
    prefix = info_hash[:16]
    return "item-" + prefix
+
+
def default_client_job_id() -> str:
    """Fresh session job id: unix timestamp plus a short random hex suffix."""
    timestamp = int(time.time())
    suffix = secrets.token_hex(4)
    return f"import-{timestamp}-{suffix}"
+
+
def print_scan_summary(candidates: Sequence[dict], mode: str) -> None:
    """Print a short human-readable summary of the local scan results."""
    tally = {"cross_seed": 0, "data_only": 0}
    for entry in candidates:
        tally[entry["source_kind"]] += 1

    summary = [
        "",
        "Local scan complete.",
        f"Mode       : {mode}",
        f"Candidates : {len(candidates)}",
        f"Cross-seed : {tally['cross_seed']}",
        f"Data-only  : {tally['data_only']}",
        "",
    ]
    for line in summary:
        print(line)
+
+
def info(message: str) -> None:
    """Print a progress line to stdout with the standard arrow prefix."""
    print("==> " + message)
+
+
def warn(message: str) -> None:
    """Print a non-fatal warning line to stderr."""
    print("[warn] " + message, file=sys.stderr)
+
+
def fatal(message: str) -> None:
    """Print an error to stderr and abort the process with exit code 1."""
    print("[error] " + message, file=sys.stderr)
    raise SystemExit(1)
+
+
def build_parser() -> argparse.ArgumentParser:
    """Construct the command-line argument parser for the importer."""
    parser = argparse.ArgumentParser(description="Official client for the Nostradamus upload API")

    # Connection settings.
    parser.add_argument(
        "--base-url",
        required=True,
        help="Nostradamus base URL, for example https://nostradamus.foo",
    )
    parser.add_argument(
        "--importer-token",
        required=True,
        help="Dedicated importer token from Nostradamus settings",
    )

    # Input selection — each option is repeatable.
    parser.add_argument("--torrent-root", action="append", help="Directory containing existing .torrent files")
    parser.add_argument("--torrent", action="append", help="Single .torrent file to import")
    parser.add_argument("--data-root", action="append", help="Directory whose direct children should be imported as separate data-only items")
    parser.add_argument("--path", action="append", help="Single file or directory to import as exactly one data-only item")

    # Session and transport tuning.
    parser.add_argument("--client-job-id", help="Optional stable client job id for the session")
    parser.add_argument("--state-file", default=DEFAULT_STATE_FILE, help=f"Local state file path (default: {DEFAULT_STATE_FILE})")
    parser.add_argument("--timeout", type=int, default=DEFAULT_TIMEOUT, help=f"HTTP timeout in seconds (default: {DEFAULT_TIMEOUT})")
    parser.add_argument("--allow-insecure-http", action="store_true", help="Allow plain HTTP for non-local hosts")

    return parser
+
+
def main(argv: Optional[Sequence[str]] = None) -> int:
    """CLI entry point: parse arguments and execute one upload run."""
    args = build_parser().parse_args(argv)
    return ImportUploader(args).run()
+
+
# Script entry point: propagate main()'s return code as the process exit status.
if __name__ == "__main__":
    raise SystemExit(main())