Add Comments

马一丁
Commit 3e4aa6366d3510d26056208115f909f90f27cec4 3e4aa636 1 parent 4846b1f7
Showing 12 changed files with 72 additions and 3 deletions
ReportEngine/agent.py
ReportEngine/core/chapter_storage.py
ReportEngine/core/stitcher.py
ReportEngine/core/template_parser.py
ReportEngine/flask_interface.py
ReportEngine/ir/validator.py
ReportEngine/llms/base.py
ReportEngine/nodes/chapter_generation_node.py
ReportEngine/nodes/document_layout_node.py
ReportEngine/nodes/word_budget_node.py
ReportEngine/renderers/html_renderer.py
ReportEngine/utils/config.py
--- a/ReportEngine/agent.py
View file @3e4aa63
+++ b/ReportEngine/agent.py
View file @3e4aa63
@@ -35,6 +35,7 @@ class FileCountBaseline:
     """文件数量基准管理器"""
     
     def __init__(self):
+         """在初始化阶段加载或创建文件数量基准快照"""
         self.baseline_file = 'logs/report_baseline.json'
         self.baseline_data = self._load_baseline()
     
--- a/ReportEngine/core/chapter_storage.py
View file @3e4aa63
+++ b/ReportEngine/core/chapter_storage.py
View file @3e4aa63
@@ -29,6 +29,7 @@ class ChapterRecord:
     updated_at: str = field(default_factory=lambda: datetime.utcnow().isoformat() + "Z")
 
     def to_dict(self) -> Dict[str, object]:
+         """将记录转换为便于写入manifest.json的序列化字典"""
         return {
             "chapterId": self.chapter_id,
             "slug": self.slug,
@@ -54,6 +55,12 @@ class ChapterStorage:
     """
 
     def __init__(self, base_dir: str):
+         """
+         创建章节存储器。
+ 
+         Args:
+             base_dir: 所有输出run目录的根路径
+         """
         self.base_dir = Path(base_dir)
         self.base_dir.mkdir(parents=True, exist_ok=True)
         self._manifests: Dict[str, Dict[str, object]] = {}
@@ -133,6 +140,7 @@ class ChapterStorage:
         return final_path
 
     def load_chapters(self, run_dir: Path) -> List[Dict[str, object]]:
+         """从指定run目录读取全部chapter.json并按order排序返回"""
         payloads: List[Dict[str, object]] = []
         for child in sorted(run_dir.iterdir()):
             if not child.is_dir():
@@ -161,6 +169,7 @@ class ChapterStorage:
     # ======== 内部工具 ========
 
     def _chapter_dir(self, run_dir: Path, slug: str, order: int) -> Path:
+         """根据slug/order生成稳定的章节目录，确保各章分隔存盘"""
         safe_slug = self._safe_slug(slug)
         folder = f"{order:03d}-{safe_slug}"
         path = run_dir / folder
@@ -168,25 +177,31 @@ class ChapterStorage:
         return path
 
     def _safe_slug(self, slug: str) -> str:
+         """移除危险字符，避免生成非法文件夹名"""
         slug = slug.replace(" ", "-").replace("/", "-")
         return slug or "section"
 
     def _raw_stream_path(self, chapter_dir: Path) -> Path:
+         """返回某章节流式输出对应的raw文件路径"""
         return chapter_dir / "stream.raw"
 
     def _key(self, run_dir: Path) -> str:
+         """将run目录解析为字典缓存的键，避免重复读取磁盘"""
         return str(run_dir.resolve())
 
     def _manifest_path(self, run_dir: Path) -> Path:
+         """获取manifest.json的实际文件路径"""
         return run_dir / "manifest.json"
 
     def _write_manifest(self, run_dir: Path, manifest: Dict[str, object]):
+         """将内存中的manifest快照全量写回磁盘"""
         self._manifest_path(run_dir).write_text(
             json.dumps(manifest, ensure_ascii=False, indent=2),
             encoding="utf-8",
         )
 
     def _read_manifest(self, run_dir: Path) -> Dict[str, object]:
+         """从磁盘读取已有manifest，用于进程重启或多实例协作"""
         manifest_path = self._manifest_path(run_dir)
         if manifest_path.exists():
             return json.loads(manifest_path.read_text(encoding="utf-8"))
--- a/ReportEngine/core/stitcher.py
View file @3e4aa63
+++ b/ReportEngine/core/stitcher.py
View file @3e4aa63
@@ -16,6 +16,7 @@ class DocumentComposer:
     """
 
     def __init__(self):
+         """初始化装订器并记录已使用的锚点，避免重复"""
         self._seen_anchors: Set[str] = set()
 
     def build_document(
--- a/ReportEngine/core/template_parser.py
View file @3e4aa63
+++ b/ReportEngine/core/template_parser.py
View file @3e4aa63
@@ -30,6 +30,7 @@ class TemplateSection:
     outline: List[str] = field(default_factory=list)
 
     def to_dict(self) -> dict:
+         """将章节实体序列化为字典，方便传给LLM或落盘"""
         return {
             "title": self.title,
             "slug": self.slug,
@@ -185,6 +186,7 @@ def _build_slug(number: str, title: str) -> str:
 
 
 def _slugify_text(text: str) -> str:
+     """对任意文本做降噪与转写，得到URL友好的slug片段"""
     text = unicodedata.normalize("NFKD", text)
     text = text.replace("·", "-").replace(" ", "-")
     text = re.sub(r"[^0-9a-zA-Z\u4e00-\u9fff-]+", "-", text)
@@ -193,6 +195,7 @@ def _slugify_text(text: str) -> str:
 
 
 def _ensure_unique_slug(slug: str, used: set) -> str:
+     """若slug重复则自动追加序号，直到在used集合中唯一"""
     if slug not in used:
         used.add(slug)
         return slug
--- a/ReportEngine/flask_interface.py
View file @3e4aa63
+++ b/ReportEngine/flask_interface.py
View file @3e4aa63
@@ -40,6 +40,14 @@ class ReportTask:
     """报告生成任务"""
 
     def __init__(self, query: str, task_id: str, custom_template: str = ""):
+         """
+         初始化任务对象，记录查询词、自定义模板与运行期元数据。
+ 
+         Args:
+             query: 最终需要生成的报告主题
+             task_id: 任务唯一ID，通常由时间戳构造
+             custom_template: 可选的自定义Markdown模板
+         """
         self.task_id = task_id
         self.query = query
         self.custom_template = custom_template
@@ -470,6 +478,7 @@ def get_templates():
 # 错误处理
 @report_bp.errorhandler(404)
 def not_found(error):
+     """404兜底处理：保证接口统一返回JSON结构"""
     logger.exception(f"API端点不存在: {str(error)}")
     return jsonify({
         'success': False,
@@ -479,6 +488,7 @@ def not_found(error):
 
 @report_bp.errorhandler(500)
 def internal_error(error):
+     """500兜底处理：捕获未被主动捕获的异常"""
     logger.exception(f"服务器内部错误: {str(error)}")
     return jsonify({
         'success': False,
--- a/ReportEngine/ir/validator.py
View file @3e4aa63
+++ b/ReportEngine/ir/validator.py
View file @3e4aa63
@@ -23,6 +23,7 @@ class IRValidator:
     """
 
     def __init__(self, schema_version: str = IR_VERSION):
+         """记录当前Schema版本，便于未来多版本并存"""
         self.schema_version = schema_version
 
     # ======== 对外接口 ========
--- a/ReportEngine/llms/base.py
View file @3e4aa63
+++ b/ReportEngine/llms/base.py
View file @3e4aa63
 """
- Unified OpenAI-compatible LLM client for the Report Engine, with retry support.
+ Report Engine 默认的OpenAI兼容LLM客户端封装，内置重试/流式能力。
 """
 
 import os
@@ -19,7 +19,9 @@ try:
     from retry_helper import with_retry, LLM_RETRY_CONFIG
 except ImportError:
     def with_retry(config=None):
+         """简化版with_retry占位，实现与真实装饰器一致的调用签名"""
         def decorator(func):
+             """直接返回原函数，确保无retry依赖时代码仍可运行"""
             return func
         return decorator
 
@@ -27,9 +29,17 @@ except ImportError:
 
 
 class LLMClient:
-     """Minimal wrapper around the OpenAI-compatible chat completion API."""
+     """针对OpenAI Chat Completion API的轻量封装，统一Report Engine调用入口。"""
 
     def __init__(self, api_key: str, model_name: str, base_url: Optional[str] = None):
+         """
+         初始化LLM客户端并保存基础连接信息。
+ 
+         Args:
+             api_key: 用于鉴权的API Token
+             model_name: 具体模型ID，用于定位供应商能力
+             base_url: 自定义兼容接口地址，默认为OpenAI官方
+         """
         if not api_key:
             raise ValueError("Report Engine LLM API key is required.")
         if not model_name:
@@ -55,6 +65,17 @@ class LLMClient:
 
     @with_retry(LLM_RETRY_CONFIG)
     def invoke(self, system_prompt: str, user_prompt: str, **kwargs) -> str:
+         """
+         以非流式方式调用LLM，并返回一次性完成的完整响应。
+ 
+         Args:
+             system_prompt: 系统角色提示
+             user_prompt: 用户高优先级指令
+             **kwargs: 允许透传temperature/top_p等采样参数
+ 
+         Returns:
+             去除首尾空白后的LLM响应文本
+         """
         messages = [
             {"role": "system", "content": system_prompt},
             {"role": "user", "content": user_prompt},
@@ -142,11 +163,13 @@ class LLMClient:
 
     @staticmethod
     def validate_response(response: Optional[str]) -> str:
+         """兜底处理None/空白字符串，防止上层逻辑崩溃"""
         if response is None:
             return ""
         return response.strip()
 
     def get_model_info(self) -> Dict[str, Any]:
+         """以字典形式返回当前客户端的模型/提供方/基础URL信息"""
         return {
             "provider": self.provider,
             "model": self.model_name,
--- a/ReportEngine/nodes/chapter_generation_node.py
View file @3e4aa63
+++ b/ReportEngine/nodes/chapter_generation_node.py
View file @3e4aa63
@@ -34,6 +34,14 @@ class ChapterGenerationNode(BaseNode):
     _COLON_EQUALS_PATTERN = re.compile(r'(":\s*)=')
 
     def __init__(self, llm_client, validator: IRValidator, storage: ChapterStorage):
+         """
+         记录LLM客户端/校验器/章节存储器，便于run方法调度。
+ 
+         Args:
+             llm_client: 实际调用大模型的客户端
+             validator: IR结构校验器
+             storage: 负责章节流式落盘的存储器
+         """
         super().__init__(llm_client, "ChapterGenerationNode")
         self.validator = validator
         self.storage = storage
@@ -385,6 +393,7 @@ class ChapterGenerationNode(BaseNode):
         """修正常见的结构性错误（例如list.items嵌套过深）"""
 
         def walk(blocks: List[Dict[str, Any]] | None):
+             """递归检查并修复嵌套结构，保证每个block合法"""
             if not isinstance(blocks, list):
                 return
             for block in blocks:
@@ -485,6 +494,7 @@ class ChapterGenerationNode(BaseNode):
 
     @staticmethod
     def _as_paragraph_block(text: str) -> Dict[str, Any]:
+         """将字符串快速包装成paragraph block，方便统一处理"""
         return {
             "type": "paragraph",
             "inlines": [{"text": text or ""}],
--- a/ReportEngine/nodes/document_layout_node.py
View file @3e4aa63
+++ b/ReportEngine/nodes/document_layout_node.py
View file @3e4aa63
@@ -21,6 +21,7 @@ class DocumentLayoutNode(BaseNode):
     """负责生成全局标题、目录与Hero设计"""
 
     def __init__(self, llm_client):
+         """记录LLM客户端并设置节点名字，供BaseNode日志使用"""
         super().__init__(llm_client, "DocumentLayoutNode")
 
     def run(
--- a/ReportEngine/nodes/word_budget_node.py
View file @3e4aa63
+++ b/ReportEngine/nodes/word_budget_node.py
View file @3e4aa63
@@ -21,6 +21,7 @@ class WordBudgetNode(BaseNode):
     """规划各章节字数与重点"""
 
     def __init__(self, llm_client):
+         """仅记录LLM客户端引用，方便run阶段发起请求"""
         super().__init__(llm_client, "WordBudgetNode")
 
     def run(
--- a/ReportEngine/renderers/html_renderer.py
View file @3e4aa63
+++ b/ReportEngine/renderers/html_renderer.py
View file @3e4aa63
@@ -13,6 +13,7 @@ class HTMLRenderer:
     """Document IR → HTML 渲染器"""
 
     def __init__(self, config: Dict[str, Any] | None = None):
+         """初始化渲染器缓存并允许注入额外配置（如主题覆盖）"""
         self.config = config or {}
         self.document: Dict[str, Any] = {}
         self.widget_scripts: List[str] = []
--- a/ReportEngine/utils/config.py
View file @3e4aa63
+++ b/ReportEngine/utils/config.py
View file @3e4aa63
 """
- Configuration management module for the Report Engine.
+ Report Engine 配置模块，统一读取环境变量并提供类型安全的访问方式。
 """
 
 import os
@@ -34,6 +34,7 @@ class Settings(BaseSettings):
     CHART_STYLE: str = Field("modern", description="图表样式：modern/classic/")
 
     class Config:
+         """Pydantic配置：允许从.env读取并兼容大小写"""
         env_file = ".env"
         env_prefix = ""
         case_sensitive = False
@@ -43,6 +44,7 @@ settings = Settings()
 
 
 def print_config(config: Settings):
+     """将当前配置项按人类可读格式输出到日志，方便排障"""
     message = ""
     message += "\n=== Report Engine 配置 ===\n"
     message += f"LLM 模型: {config.REPORT_ENGINE_MODEL_NAME}\n"