Reset loaded_states per task to prevent cross-task leakage

马一丁
Commit 1560df2d6dc240fe2844435ed1a9dc1f815edc69 1560df2d 1 parent 30aa7f45
Showing 1 changed file with 11 additions and 10 deletions
ReportEngine/agent.py
--- a/ReportEngine/agent.py
View file @1560df2
+++ b/ReportEngine/agent.py
View file @1560df2
@@ -240,6 +240,9 @@ class ReportAgent:
         # 状态
         self.state = ReportState()
         
+         # GraphRAG 状态数据（每次 load_input_files 时重置）
+         self._loaded_states = {}
+         
         # 确保输出目录存在
         os.makedirs(self.config.OUTPUT_DIR, exist_ok=True)
         os.makedirs(self.config.DOCUMENT_IR_OUTPUT_DIR, exist_ok=True)
@@ -901,16 +904,14 @@ class ReportAgent:
             Graph: 构建好的知识图谱；失败返回 None。
         """
         try:
-             # 解析 State JSON（如果在 load_input_files 时已加载）
-             states = {}
-             state_parser = StateParser()
-             
-             # 尝试从 reports 目录查找 State JSON
-             # 注意：这里假设 reports 字典的键对应引擎目录
-             for engine in ['insight', 'media', 'query']:
-                 # 尝试从全局状态获取（如果之前已加载）
-                 if hasattr(self, '_loaded_states') and engine in self._loaded_states:
-                     states[engine] = self._loaded_states[engine]
+             # 直接使用 load_input_files 中加载的 State JSON
+             # 注意：_loaded_states 在每次 load_input_files 调用时会被重置，
+             # 确保不会有跨任务的数据泄漏
+             states = {
+                 engine: state
+                 for engine, state in self._loaded_states.items()
+                 if engine in ['insight', 'media', 'query']
+             }
             
             # 解析论坛日志
             forum_entries = []