monitor.py
12.5 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
"""
日志监控器 - 实时监控三个log文件中的SummaryNode和ReportFormattingNode输出
"""
import os
import time
import threading
from pathlib import Path
from datetime import datetime
import re
from typing import Dict, Optional, List
from threading import Lock
class LogMonitor:
"""基于文件变化的智能日志监控器"""
def __init__(self, log_dir: str = "logs"):
"""初始化日志监控器"""
self.log_dir = Path(log_dir)
self.forum_log_file = self.log_dir / "forum.log"
# 要监控的日志文件
self.monitored_logs = {
'insight': self.log_dir / 'insight.log',
'media': self.log_dir / 'media.log',
'query': self.log_dir / 'query.log'
}
# 监控状态
self.is_monitoring = False
self.monitor_thread = None
self.file_positions = {} # 记录每个文件的读取位置
self.file_line_counts = {} # 记录每个文件的行数
self.is_searching = False # 是否正在搜索
self.search_inactive_count = 0 # 搜索非活跃计数器
self.write_lock = Lock() # 写入锁,防止并发写入冲突
# 目标节点名称 - 直接匹配字符串
self.target_nodes = [
'FirstSummaryNode',
'ReflectionSummaryNode',
'ReportFormattingNode'
]
# 确保logs目录存在
self.log_dir.mkdir(exist_ok=True)
def clear_forum_log(self):
"""清空forum.log文件"""
try:
if self.forum_log_file.exists():
self.forum_log_file.unlink()
# 创建新的forum.log文件并写入开始标记
with open(self.forum_log_file, 'w', encoding='utf-8') as f:
start_time = datetime.now().strftime('%Y-%m-%d %H:%M:%S')
f.write(f"=== ForumEgine 监控开始 - {start_time} ===\n")
print(f"ForumEgine: forum.log 已清空并初始化")
except Exception as e:
print(f"ForumEgine: 清空forum.log失败: {e}")
def write_to_forum_log(self, content: str):
"""写入内容到forum.log(线程安全)"""
try:
with self.write_lock: # 使用锁确保线程安全
with open(self.forum_log_file, 'a', encoding='utf-8') as f:
timestamp = datetime.now().strftime('%H:%M:%S')
f.write(f"[{timestamp}] {content}\n")
f.flush()
except Exception as e:
print(f"ForumEgine: 写入forum.log失败: {e}")
def is_target_log_line(self, line: str) -> bool:
"""检查是否是目标日志行(SummaryNode或ReportFormattingNode)"""
# 简单字符串包含检查,更可靠
for node_name in self.target_nodes:
if node_name in line:
return True
return False
def extract_node_content(self, line: str) -> Optional[str]:
"""提取节点内容"""
# 移除时间戳部分,保留节点名称和消息
# 格式: [HH:MM:SS] [NodeName] message
match = re.search(r'\[\d{2}:\d{2}:\d{2}\]\s*(.+)', line)
if match:
return match.group(1).strip()
return line.strip()
def get_file_size(self, file_path: Path) -> int:
"""获取文件大小"""
try:
return file_path.stat().st_size if file_path.exists() else 0
except:
return 0
def get_file_line_count(self, file_path: Path) -> int:
"""获取文件行数"""
try:
if not file_path.exists():
return 0
with open(file_path, 'r', encoding='utf-8') as f:
return sum(1 for _ in f)
except:
return 0
# 移除这个方法,逻辑已经合并到monitor_logs中
def read_new_lines(self, file_path: Path, app_name: str) -> List[str]:
"""读取文件中的新行"""
new_lines = []
try:
if not file_path.exists():
return new_lines
current_size = self.get_file_size(file_path)
last_position = self.file_positions.get(app_name, 0)
# 如果文件变小了,说明被清空了,重新从头开始
if current_size < last_position:
last_position = 0
if current_size > last_position:
with open(file_path, 'r', encoding='utf-8') as f:
f.seek(last_position)
new_content = f.read()
new_lines = new_content.split('\n')
# 更新位置
self.file_positions[app_name] = f.tell()
# 过滤空行
new_lines = [line.strip() for line in new_lines if line.strip()]
except Exception as e:
print(f"ForumEgine: 读取{app_name}日志失败: {e}")
return new_lines
def monitor_logs(self):
"""智能监控日志文件"""
print("ForumEgine: 开始智能监控日志文件...")
# 初始化文件行数和位置 - 记录当前状态作为基线
for app_name, log_file in self.monitored_logs.items():
self.file_line_counts[app_name] = self.get_file_line_count(log_file)
self.file_positions[app_name] = self.get_file_size(log_file)
print(f"ForumEgine: {app_name} 基线行数: {self.file_line_counts[app_name]}")
while self.is_monitoring:
try:
# 同时检测三个log文件的变化
any_growth = False
any_shrink = False
captured_any = False
# 为每个log文件独立处理
for app_name, log_file in self.monitored_logs.items():
current_lines = self.get_file_line_count(log_file)
previous_lines = self.file_line_counts.get(app_name, 0)
if current_lines > previous_lines:
any_growth = True
# 立即读取新增内容
new_lines = self.read_new_lines(log_file, app_name)
# 先检查是否需要触发搜索(只触发一次)
if not self.is_searching:
for line in new_lines:
if line.strip() and 'FirstSummaryNode' in line:
print(f"ForumEgine: 在{app_name}中检测到FirstSummaryNode,开始监控记录")
self.is_searching = True
self.search_inactive_count = 0
# 清空forum.log开始新会话
self.clear_forum_log()
break # 找到一个就够了,跳出循环
# 处理所有新增内容(如果正在搜索状态)
if self.is_searching:
for line in new_lines:
if line.strip() and self.is_target_log_line(line):
# 立即记录目标节点输出
formatted_content = f"[{app_name.upper()}] {line.strip()}"
self.write_to_forum_log(formatted_content)
print(f"ForumEgine: 捕获 - {formatted_content}")
captured_any = True
elif current_lines < previous_lines:
any_shrink = True
print(f"ForumEgine: 检测到 {app_name} 日志缩短,将重置基线")
# 重置文件位置到新的文件末尾
self.file_positions[app_name] = self.get_file_size(log_file)
# 更新行数记录
self.file_line_counts[app_name] = current_lines
# 检查是否应该结束当前搜索会话
if self.is_searching:
if any_shrink:
# log变短,结束当前搜索会话,重置为等待状态
print("ForumEgine: 日志缩短,结束当前搜索会话,回到等待状态")
self.is_searching = False
self.search_inactive_count = 0
# 写入结束标记
end_time = datetime.now().strftime('%Y-%m-%d %H:%M:%S')
self.write_to_forum_log(f"=== ForumEgine 搜索会话结束 - {end_time} ===")
print("ForumEgine: 已重置基线,等待下次FirstSummaryNode触发")
elif not any_growth and not captured_any:
# 没有增长也没有捕获内容,增加非活跃计数
self.search_inactive_count += 1
if self.search_inactive_count >= 30: # 30秒无活动才结束
print("ForumEgine: 长时间无活动,结束搜索会话")
self.is_searching = False
self.search_inactive_count = 0
# 写入结束标记
end_time = datetime.now().strftime('%Y-%m-%d %H:%M:%S')
self.write_to_forum_log(f"=== ForumEgine 搜索会话超时结束 - {end_time} ===")
else:
self.search_inactive_count = 0 # 重置计数器
# 短暂休眠
time.sleep(1)
except Exception as e:
print(f"ForumEgine: 监控过程中出错: {e}")
import traceback
traceback.print_exc()
time.sleep(2)
print("ForumEgine: 停止监控日志文件")
def start_monitoring(self):
"""开始智能监控"""
if self.is_monitoring:
print("ForumEgine: 监控已经在运行中")
return False
try:
# 启动监控
self.is_monitoring = True
self.monitor_thread = threading.Thread(target=self.monitor_logs, daemon=True)
self.monitor_thread.start()
print("ForumEgine: 智能监控已启动")
return True
except Exception as e:
print(f"ForumEgine: 启动监控失败: {e}")
self.is_monitoring = False
return False
def stop_monitoring(self):
"""停止监控"""
if not self.is_monitoring:
print("ForumEgine: 监控未运行")
return
try:
self.is_monitoring = False
if self.monitor_thread and self.monitor_thread.is_alive():
self.monitor_thread.join(timeout=2)
# 写入结束标记
end_time = datetime.now().strftime('%Y-%m-%d %H:%M:%S')
self.write_to_forum_log(f"=== ForumEgine 监控结束 - {end_time} ===")
print("ForumEgine: 监控已停止")
except Exception as e:
print(f"ForumEgine: 停止监控失败: {e}")
def get_forum_log_content(self) -> List[str]:
"""获取forum.log的内容"""
try:
if not self.forum_log_file.exists():
return []
with open(self.forum_log_file, 'r', encoding='utf-8') as f:
return [line.rstrip('\n\r') for line in f.readlines()]
except Exception as e:
print(f"ForumEgine: 读取forum.log失败: {e}")
return []
# 全局监控器实例
_monitor_instance = None
def get_monitor() -> LogMonitor:
"""获取全局监控器实例"""
global _monitor_instance
if _monitor_instance is None:
_monitor_instance = LogMonitor()
return _monitor_instance
def start_forum_monitoring():
"""启动ForumEgine智能监控"""
return get_monitor().start_monitoring()
def stop_forum_monitoring():
"""停止ForumEgine监控"""
get_monitor().stop_monitoring()
def get_forum_log():
"""获取forum.log内容"""
return get_monitor().get_forum_log_content()