Stage 1 (before OpenAI rewrite): reject if raw content has fewer than pipeline_min_words_raw words (default 120). Stage 2 (after rewrite): reject if rewritten text has fewer than pipeline_min_words_rewritten words (default 150). Both stages set status='error' with a descriptive note and skip WP draft creation. The reserved publish slot is released so it stays available for the next article. Quality rejections don't abort the pipeline — processing continues with the next article. New config settings (overridable via .env): PIPELINE_MIN_WORDS_RAW=120, PIPELINE_MIN_WORDS_REWRITTEN=150. Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
64 lines
2.7 KiB
Python
64 lines
2.7 KiB
Python
from functools import lru_cache
|
|
from pathlib import Path
|
|
|
|
from dotenv import load_dotenv
|
|
from pydantic import AliasChoices, Field
|
|
from pydantic_settings import BaseSettings, SettingsConfigDict
|
|
|
|
|
|
class Settings(BaseSettings):
    """Typed application configuration for the rss-news backend.

    Values come from process environment variables and from the dotenv files
    listed in ``model_config``. Fields declared with ``validation_alias`` are
    populated from the environment variable names given in ``AliasChoices``
    (the first name that is set is used).
    """

    # Prefer the backend-specific env file to avoid collisions with the legacy
    # root .env. pydantic-settings loads the files in the order given and lets
    # LATER entries override earlier ones, so "backend/.env" must come last
    # for it to win over ".env".
    model_config = SettingsConfigDict(
        env_file=(".env", "backend/.env"),
        env_file_encoding="utf-8",
        extra="ignore",  # keys that match no field are ignored, not rejected
    )

    # Application identity.
    # NOTE(review): the secret key and admin password defaults below are
    # placeholders; presumably real deployments override them via env.
    app_env: str = "development"
    app_name: str = "rss-news-backend"
    app_secret_key: str = "replace-with-a-long-random-secret"

    # Admin login credentials.
    app_admin_username: str = "admin"
    app_admin_password: str = "change-me"

    # Session cookie.
    session_cookie_name: str = "rss_news_session"
    session_max_age_seconds: int = 28800  # 8 hours

    # Database file location (relative path).
    app_db_path: str = "backend/data/rss_news.db"

    # WordPress connection; each value accepts a long and a short variable name.
    wordpress_base_url: str | None = Field(
        default=None,
        validation_alias=AliasChoices("WORDPRESS_BASE_URL", "WP_BASE_URL"),
    )
    wordpress_username: str | None = Field(
        default=None,
        validation_alias=AliasChoices("WORDPRESS_USERNAME", "WP_USERNAME"),
    )
    wordpress_app_password: str | None = Field(
        default=None,
        validation_alias=AliasChoices("WORDPRESS_APP_PASSWORD", "WP_PASSWORD"),
    )
    wordpress_default_status: str = "draft"

    # OpenAI
    openai_api_key: str | None = Field(
        default=None,
        validation_alias=AliasChoices("OPENAI_API_KEY"),
    )
    openai_model: str = "gpt-4o-mini"

    # Telegram Bot
    telegram_bot_token: str | None = Field(
        default=None,
        validation_alias=AliasChoices("TELEGRAM_BOT_TOKEN"),
    )
    telegram_chat_id: str | None = Field(
        default=None,
        validation_alias=AliasChoices("TELEGRAM_CHAT_ID"),
    )
    telegram_webhook_secret: str | None = Field(
        default=None,
        validation_alias=AliasChoices("TELEGRAM_WEBHOOK_SECRET"),
    )

    # N8N API authentication
    n8n_api_key: str | None = Field(
        default=None,
        validation_alias=AliasChoices("N8N_API_KEY"),
    )

    # Pipeline behaviour
    pipeline_relevance_auto: int = 80  # >= this: auto-process
    pipeline_relevance_warn: int = 60  # >= this: Telegram warning, else reject
    pipeline_max_drafts_per_day: int = 2
    pipeline_publish_hours: str = "9,14"  # comma-separated preferred publish hours (CET)
    pipeline_min_words_raw: int = 120  # minimum words in raw content before rewrite (else reject)
    pipeline_min_words_rewritten: int = 150  # minimum words in rewritten content (else reject)
|
|
|
|
|
|
@lru_cache(maxsize=1)
def get_settings() -> Settings:
    """Return the application settings, building them on the first call only.

    Before ``Settings`` is constructed, every dotenv file that exists among
    the candidates below is loaded into the process environment. Loading uses
    ``override=False``, so a variable that is already set (by the real
    environment or by a file loaded earlier) is left untouched; earlier
    candidates therefore take precedence over later ones.

    Returns:
        The ``Settings`` instance; ``lru_cache`` hands back the same object
        on subsequent calls.
    """
    # Ordered from highest to lowest precedence: shared legacy env from the
    # original rss-news workspace first, then the backend file, then the root.
    # NOTE(review): the first entry is a machine-specific absolute path; it is
    # simply skipped on hosts where it does not exist.
    dotenv_search_order = [
        Path("/Users/oliver/Documents/rss-news/.env"),
        Path("backend/.env"),
        Path(".env"),
    ]

    # filter() is lazy, so each existence check runs right before its load.
    for dotenv_file in filter(Path.exists, dotenv_search_order):
        load_dotenv(dotenv_file, override=False)

    return Settings()
|