Files
diary-news/backend/app/models/source.py
Mavis d0d1014505 feat(db): 0003 migration + LlmSetting/Source 模型加 blocklist_tags
- 新增 alembic 0003: sources.blocklist_tags + llm_settings.blocklist_tags(JSONB)
- 两层配置:全局(llm_settings) + per-source(sources),合并去重后注入 classify prompt
- 默认空数组,不影响存量数据;admin API 在下个 commit 暴露编辑入口
2026-06-09 14:30:38 +08:00

74 lines
2.7 KiB
Python

"""采集源模型。"""
from __future__ import annotations
import enum
from datetime import datetime
from sqlalchemy import (
JSON,
Boolean,
DateTime,
Enum,
Integer,
String,
Text,
func,
)
from sqlalchemy.dialects.postgresql import JSONB
from sqlalchemy.orm import Mapped, mapped_column, relationship
from app.database import Base
class SourceKind(str, enum.Enum):
    """Closed set of source kinds a ``Source`` row can be tagged with.

    The ``str`` mix-in makes every member compare equal to its plain string
    value, so members can be used wherever the raw value is expected.
    """

    RSS = "rss"
    HTML_LIST = "html_list"
    TG_CHANNEL = "tg_channel"
class Source(Base):
    """ORM model for one row of the ``sources`` table.

    Holds the configuration of a collection source (name, slug, kind, URL,
    fetch schedule, per-source tag blocklist) together with bookkeeping
    columns for the last fetch and row timestamps.
    """

    __tablename__ = "sources"

    id: Mapped[int] = mapped_column(primary_key=True)
    name: Mapped[str] = mapped_column(String(128), nullable=False)
    # Unique, indexed identifier string for the source.
    slug: Mapped[str] = mapped_column(String(128), unique=True, index=True, nullable=False)
    kind: Mapped[SourceKind] = mapped_column(
        Enum(
            SourceKind,
            name="source_kind",
            # Persist the enum *values* ("rss", ...) instead of the member names.
            values_callable=lambda x: [e.value for e in x],
        ),
        default=SourceKind.RSS,
        nullable=False,
    )
    url: Mapped[str] = mapped_column(Text, nullable=False)
    detail_selector: Mapped[dict | None] = mapped_column(JSON)
    # Presumably minutes (per the ``_min`` suffix) -- confirm against the scheduler.
    fetch_interval_min: Mapped[int] = mapped_column(Integer, default=60, nullable=False)
    fetch_cron: Mapped[str | None] = mapped_column(String(64))  # 5-field cron expression
    translate_to: Mapped[str] = mapped_column(String(8), default="zh", nullable=False)
    enabled: Mapped[bool] = mapped_column(Boolean, default=True, nullable=False)
    region: Mapped[str | None] = mapped_column(String(32), index=True)
    language_src: Mapped[str | None] = mapped_column(String(8))
    priority: Mapped[int] = mapped_column(Integer, default=50, nullable=False, index=True)
    headers_json: Mapped[dict | None] = mapped_column(JSON)
    # Source-level blocklist of classification tags (e.g. ["体育", "娱乐"],
    # i.e. sports / entertainment); used after being merged with
    # llm_settings.blocklist_tags.
    # NOTE(review): a plain JSONB column does not track in-place mutation
    # (e.g. ``.append``); confirm callers always assign a new list.
    blocklist_tags: Mapped[list[str]] = mapped_column(
        JSONB, nullable=False, default=list, server_default="[]"
    )
    last_fetched_at: Mapped[datetime | None] = mapped_column(DateTime(timezone=True))
    last_status: Mapped[str | None] = mapped_column(String(64))
    consecutive_failures: Mapped[int] = mapped_column(Integer, default=0, nullable=False)
    created_at: Mapped[datetime] = mapped_column(
        DateTime(timezone=True), server_default=func.now(), nullable=False
    )
    updated_at: Mapped[datetime] = mapped_column(
        DateTime(timezone=True), server_default=func.now(), onupdate=func.now(), nullable=False
    )
    # NOTE(review): with lazy="noload" the collection is not loaded from the
    # database on access; verify that ORM-level delete cascade still reaches
    # existing articles, or that a DB-level ON DELETE rule covers it.
    articles: Mapped[list["Article"]] = relationship(  # noqa: F821
        back_populates="source", cascade="all, delete-orphan", lazy="noload"
    )

    def __repr__(self) -> str:
        """Return a short debug representation of the row.

        Safe to call on an instance that has not been flushed yet.
        """
        # The column-level default for ``kind`` is applied at INSERT time, so a
        # freshly constructed instance may still hold None (or a raw string).
        # Fall back to the attribute itself rather than raising AttributeError
        # from inside repr().
        kind = getattr(self.kind, "value", self.kind)
        return f"<Source id={self.id} slug={self.slug} kind={kind}>"