from functools import lru_cache
from urllib.parse import quote

from pydantic import Field
from pydantic_settings import BaseSettings, SettingsConfigDict


class Settings(BaseSettings):
    """Application configuration read from environment variables and `.env`.

    Unknown variables are ignored and variable names are matched
    case-insensitively (see `model_config`). Fields whose name ends in `_raw`
    hold the unparsed env string; the matching property exposes the parsed value.
    """

    model_config = SettingsConfigDict(env_file=".env", extra="ignore", case_sensitive=False)

    database_url: str = Field(
        default="postgresql+psycopg://goon:goon@localhost:5432/goon",
        validation_alias="DATABASE_URL",
    )
    tpdb_api_token: str | None = Field(default=None, validation_alias="TPDB_API_TOKEN")
    tpdb_base_url: str = Field(
        default="https://api.theporndb.net", validation_alias="TPDB_BASE_URL"
    )
    stashdb_api_key: str | None = Field(default=None, validation_alias="STASHDB_API_KEY")
    stashdb_graphql_url: str = Field(
        default="https://stashdb.org/graphql", validation_alias="STASHDB_GRAPHQL_URL"
    )
    log_level: str = Field(default="INFO", validation_alias="LOG_LEVEL")

    # Sentry observability — an empty DSN makes init a no-op (devel/local). The cloud
    # free tier (5k errors/month) is enough for a single-user app.
    sentry_dsn: str | None = Field(default=None, validation_alias="SENTRY_DSN")
    sentry_environment: str = Field(default="dev", validation_alias="SENTRY_ENVIRONMENT")
    sentry_traces_sample_rate: float = Field(
        default=0.1, validation_alias="SENTRY_TRACES_SAMPLE_RATE"
    )

    api_keys_raw: str = Field(default="", validation_alias="API_KEYS")
    """Comma-separated list of API keys. Empty = auth disabled (dev/local only)."""

    allowed_app_sig_hashes_raw: str = Field(default="", validation_alias="ALLOWED_APP_SIG_HASH")
    """Whitelist of SHA256 (hex) APK signature hashes accepted by the backend.

    Every mobile request sends `X-App-Signature` with the hash of the signing cert
    (PackageManager.GET_SIGNING_CERTIFICATES). Empty = check disabled (dev/initial
    rollout). List = comma-separated lowercase hex. Re-packaging the APK with a
    different keystore changes the hash → 403."""

    auto_merge_threshold: float = 0.92
    review_threshold: float = 0.75
    fingerprint_hamming_max: int = 5
    title_token_set_min: int = 88
    date_window_days: int = 7

    # Skip ingesting clip-store scenes (ManyVids/IWantClips/Clips4Sale/...) from the
    # canonical source — they are permanent orphans (free tubes do not host them),
    # ~56% of the TPDB/StashDB ingest. False = ingest as before. Tubes with a
    # clip-store studio are NOT skipped (they have playback).
    skip_clip_store: bool = Field(default=True, validation_alias="GOON_SKIP_CLIP_STORE")

    # Ingest watchdog cadence.
    # NOTE(review): the comment introducing this setting is truncated in the file —
    # it opens with "minimum scene duration from tube/scraper at ingest —" and resumes
    # mid-sentence at ") stopped yielding new scenes > threshold". Restore the missing
    # text (and any settings it covered) from version control.
    # Surviving text: catches the freeze of a single origin that the global monitor
    # (a single Source "tube-scraper") does not see (e.g. freshporno browse from a
    # rotating root, report 14f3a655). 6h cadence (after browse-latest).
    # Any 0/None = disabled.
    sched_ingest_watchdog_hours: int = Field(
        default=6, validation_alias="GOON_SCHED_INGEST_WATCHDOG_HOURS"
    )
    # Threshold for browse scrapers (ALL_BROWSE_SCRAPERS) — crawled once a day from
    # the listing, so 48h of silence = anomaly.
    ingest_watchdog_max_age_hours: int = Field(
        default=48, validation_alias="GOON_INGEST_WATCHDOG_MAX_AGE_HOURS"
    )
    # Threshold for performer-driven search scrapers (ALL_DIRECT_SCRAPERS) — the
    # cadence is uneven (continuous queue ~30d refresh per performer, orphan-heavy
    # ingest), so 48h would give false positives. 7d (168h): healthy search tubes were
    # observed at <6h freshness (the continuous tick hits all tubes per performer),
    # frozen ones at ≥73h → ~28× margin.
    ingest_watchdog_search_max_age_hours: int = Field(
        default=168, validation_alias="GOON_INGEST_WATCHDOG_SEARCH_MAX_AGE_HOURS"
    )

    # Taxonomy scene_count refresh — recomputes the denormalized scene counters on
    # tags/performers/studios (the hot path /tags|/performers|/studios|/favorites reads
    # the ready column instead of aggregating 6.3M scene_tags per request). 3h cadence —
    # counts may be stale by up to that long, which does not matter for the "popular"
    # sort + "(N)" badge. 0 = off.
    sched_taxonomy_counts_hours: int = Field(
        default=3, validation_alias="GOON_SCHED_TAXONOMY_COUNTS_HOURS"
    )

    # Hetzner Cloud bandwidth monitor — read-only API token (Security → API Tokens in
    # the Hetzner Cloud panel). Without a token the monitor is disabled (warning in log).
    # Free traffic per server: CX22=20TB, CPX21=20TB etc. Overage = €1/TB.
    hetzner_api_token: str | None = Field(default=None, validation_alias="HETZNER_API_TOKEN")
    hetzner_server_id: int | None = Field(default=None, validation_alias="HETZNER_SERVER_ID")
    # Alert thresholds (% of included_traffic) — Sentry severity levels.
    hetzner_alert_info_pct: int = Field(default=50, validation_alias="HETZNER_ALERT_INFO_PCT")
    hetzner_alert_warning_pct: int = Field(default=80, validation_alias="HETZNER_ALERT_WARNING_PCT")
    hetzner_alert_error_pct: int = Field(default=95, validation_alias="HETZNER_ALERT_ERROR_PCT")
    # Traffic check cadence (hours). 0/None = monitor disabled. Default 6h (traffic
    # grows slowly; checking more often is pointless). Only works when token+id are set.
    sched_hetzner_monitor_hours: int = Field(
        default=6, validation_alias="GOON_SCHED_HETZNER_MONITOR_HOURS"
    )

    # Bright Data ISP proxy (static ISP IP, billed flat-rate NOT per-GB) — used for
    # HTML ingest (scrape) of tubes that block the VPS IP with a hard Cloudflare 403
    # even with browser-TLS (superporn). Streams are not routed through the proxy
    # anyway (CDN tokens are IP-bound). Env format: `host:port:user:pass` (Bright Data
    # panel). Empty = none.
    brightdata_proxy_raw: str = Field(default="", validation_alias="BRIGHTDATA_PROXY_URL")

    @property
    def brightdata_proxy_url(self) -> str | None:
        """Convert `host:port:user:pass` into `http://user:pass@host:port`.

        Each field is stripped of surrounding whitespace, and the user and
        password are percent-encoded so that characters such as `@`, `/` or `#`
        cannot corrupt the resulting URL.

        Returns:
            The proxy URL, or None when the setting is empty or does not consist
            of exactly four non-empty colon-separated fields.
        """
        # Trim per field, mirroring how the other *_raw settings are parsed; a
        # whitespace-only field then counts as missing.
        parts = [part.strip() for part in self.brightdata_proxy_raw.split(":")]
        if len(parts) != 4 or not all(parts):
            return None
        host, port, user, pwd = parts
        # safe="" also encodes "/", which quote() would otherwise leave untouched.
        user_enc = quote(user, safe="")
        pwd_enc = quote(pwd, safe="")
        return f"http://{user_enc}:{pwd_enc}@{host}:{port}"

    @property
    def api_keys(self) -> set[str]:
        """Return the API keys from `api_keys_raw`, trimmed, with empty entries dropped."""
        return {k.strip() for k in self.api_keys_raw.split(",") if k.strip()}

    @property
    def auth_enabled(self) -> bool:
        """Return True when at least one API key is configured."""
        return bool(self.api_keys)

    @property
    def allowed_app_sig_hashes(self) -> set[str]:
        """Return the allowed signature hashes, normalized for comparison.

        Each entry of `allowed_app_sig_hashes_raw` is trimmed, lowercased and has
        its `:` separators removed; empty entries are dropped.
        """
        return {
            h.strip().lower().replace(":", "")
            for h in self.allowed_app_sig_hashes_raw.split(",")
            if h.strip()
        }

    @property
    def app_sig_check_enabled(self) -> bool:
        """Return True when at least one allowed signature hash is configured."""
        return bool(self.allowed_app_sig_hashes)


@lru_cache
def get_settings() -> Settings:
    """Return the Settings instance, constructed on first call and cached afterwards."""
    return Settings()