feat: 新增股票数据波形图和截图功能
refactor: 重构数据库和LLM分析器逻辑 fix: 修复爬虫解析和UI显示问题 docs: 更新配置文件和注释 style: 优化代码格式和日志输出
This commit is contained in:
181
main.py
181
main.py
@@ -2,11 +2,11 @@
|
||||
主程序入口 - 股吧人气指示器
|
||||
"""
|
||||
import sys
|
||||
import logging
|
||||
import time
|
||||
from datetime import datetime
|
||||
from PySide6.QtWidgets import QApplication
|
||||
from PySide6.QtCore import QTimer, Signal, QObject
|
||||
from PySide6.QtCore import QTimer, Signal, QObject, QThread
|
||||
from loguru import logger
|
||||
|
||||
from config_manager import ConfigManager
|
||||
from database import DatabaseManager
|
||||
@@ -20,8 +20,10 @@ class BackendWorker(QObject):
|
||||
|
||||
fetch_finished = Signal(list)
|
||||
analysis_finished = Signal(float)
|
||||
analysis_result = Signal(dict) # 传递分析结果详情
|
||||
error_occurred = Signal(str)
|
||||
status_update = Signal(str)
|
||||
stock_data_fetched = Signal(str, float) # 股票数据获取信号
|
||||
|
||||
def __init__(self, config_manager: ConfigManager, db_manager: DatabaseManager,
|
||||
spider: SpiderManager, analyzer: LLMAnalyzer):
|
||||
@@ -32,92 +34,136 @@ class BackendWorker(QObject):
|
||||
self.analyzer = analyzer
|
||||
self.running = False
|
||||
self.last_fetch_time = 0
|
||||
self.fetch_interval = 60 # 默认60秒
|
||||
self.fetch_interval = 15 # 默认15秒
|
||||
self.no_new_content_count = 0 # 无新内容计数
|
||||
self.is_running_cycle = False # 防止并发执行
|
||||
self.fetch_count = 0 # 爬取次数统计
|
||||
self.analysis_count = 0 # API分析次数统计
|
||||
logger.info("BackendWorker 初始化完成")
|
||||
|
||||
def start(self):
|
||||
"""启动后台任务"""
|
||||
self.running = True
|
||||
self._run_cycle()
|
||||
logger.info("后台任务已启动")
|
||||
# 启动时立即执行第一次任务
|
||||
QTimer.singleShot(1000, self._run_cycle)
|
||||
|
||||
def stop(self):
|
||||
"""停止后台任务"""
|
||||
self.running = False
|
||||
logger.info("后台任务已停止")
|
||||
|
||||
def _run_cycle(self):
|
||||
"""运行一个周期"""
|
||||
if self.is_running_cycle:
|
||||
logger.debug("上一个周期仍在执行,跳过本次")
|
||||
return
|
||||
|
||||
self.is_running_cycle = True
|
||||
|
||||
if not self.running:
|
||||
self.is_running_cycle = False
|
||||
return
|
||||
|
||||
try:
|
||||
# 1. 爬取评论
|
||||
logger.info("开始爬取评论")
|
||||
self.status_update.emit("正在爬取评论...")
|
||||
self.fetch_count += 1
|
||||
comments = self.spider.fetch()
|
||||
|
||||
if not comments:
|
||||
self.no_new_content_count += 1
|
||||
interval = self.fetch_interval * (1 + min(self.no_new_content_count * 0.5, 2))
|
||||
# 爬取失败,使用固定间隔重试,不计入无新内容计数
|
||||
interval = 15 # 固定15秒重试
|
||||
logger.warning(f"未获取到新评论,{int(interval)}秒后重试")
|
||||
self.status_update.emit(f"无新内容,{int(interval)}秒后重试...")
|
||||
self.is_running_cycle = False
|
||||
QTimer.singleShot(int(interval * 1000), self._run_cycle)
|
||||
return
|
||||
|
||||
# 2. 写入数据库
|
||||
logger.info(f"获取到 {len(comments)} 条评论")
|
||||
self.status_update.emit(f"获取到 {len(comments)} 条评论...")
|
||||
new_ids = self.db.add_comments_batch(comments)
|
||||
|
||||
if new_ids:
|
||||
self.no_new_content_count = 0
|
||||
logger.info(f"新增 {len(new_ids)} 条评论到数据库")
|
||||
self.status_update.emit(f"新增 {len(new_ids)} 条评论")
|
||||
|
||||
# 3. 获取未分析评论并分析
|
||||
unanalyzed = self.db.get_unanalyzed_comments(limit=10)
|
||||
logger.info(f"获取到 {len(unanalyzed)} 条未分析评论")
|
||||
|
||||
if unanalyzed:
|
||||
self.status_update.emit(f"开始分析 {len(unanalyzed)} 条评论...")
|
||||
self._analyze_comments(unanalyzed)
|
||||
else:
|
||||
self.no_new_content_count += 1
|
||||
logger.info("评论已存在,未新增")
|
||||
|
||||
# 4. 更新指示器
|
||||
self._update_indicator()
|
||||
|
||||
except Exception as e:
|
||||
logger.error(f"运行错误: {str(e)}")
|
||||
self.error_occurred.emit(f"运行错误: {str(e)}")
|
||||
|
||||
# 安排下一次执行
|
||||
if self.running:
|
||||
interval = self.fetch_interval * (1 + min(self.no_new_content_count * 0.5, 2))
|
||||
interval = self.fetch_interval * (1 + min(self.no_new_content_count * 1.0, 4.0))
|
||||
logger.debug(f"下次执行将在 {int(interval)} 秒后")
|
||||
self.is_running_cycle = False
|
||||
QTimer.singleShot(int(interval * 1000), self._run_cycle)
|
||||
else:
|
||||
self.is_running_cycle = False
|
||||
|
||||
def _analyze_comments(self, comments):
|
||||
"""分析评论"""
|
||||
logger.info(f"开始分析 {len(comments)} 条评论")
|
||||
for i, comment in enumerate(comments):
|
||||
if not self.running:
|
||||
logger.warning("分析被中断")
|
||||
break
|
||||
|
||||
try:
|
||||
self.status_update.emit(f"分析 {i+1}/{len(comments)}...")
|
||||
logger.debug(f"分析第 {i+1} 条评论: {comment['content'][:50]}...")
|
||||
self.analysis_count += 1
|
||||
score, label = self.analyzer.analyze(comment['content'])
|
||||
|
||||
# 获取分析结果详情
|
||||
last_result = self.analyzer.get_last_result()
|
||||
|
||||
if score is not None:
|
||||
self.db.mark_analyzed(comment['id'], score, label)
|
||||
logger.info(f"评论 {comment['id']} 分析完成: {score}分 - {label}")
|
||||
# 更新状态显示为简洁格式
|
||||
self.status_update.emit(f"分析 {i+1}/{len(comments)}...返回{score}分")
|
||||
# 每条评论分析完成后立即更新指示器
|
||||
self._update_indicator()
|
||||
time.sleep(1.0) # 延迟,避免API限流
|
||||
else:
|
||||
self.db.mark_analyzed(comment['id'], 50, "无法判断")
|
||||
logger.warning(f"评论 {comment['id']} 无法判断")
|
||||
|
||||
except Exception as e:
|
||||
logger.error(f"分析评论 {comment.get('id', 'unknown')} 失败: {str(e)}")
|
||||
self.error_occurred.emit(f"分析失败: {str(e)}")
|
||||
self.db.mark_analyzed(comment['id'], 50, "分析异常")
|
||||
|
||||
def _update_indicator(self):
|
||||
"""更新指示器显示"""
|
||||
scores = self.db.get_all_scores()
|
||||
# 获取最新的100条评论的分数
|
||||
scores = self.db.get_all_scores(limit=100)
|
||||
|
||||
if not scores:
|
||||
logger.debug("暂无分析分数")
|
||||
return
|
||||
|
||||
# 计算平均分
|
||||
avg_score = sum(scores) / len(scores)
|
||||
logger.info(f"当前平均分: {avg_score:.2f} (基于最新的 {len(scores)} 条评论)")
|
||||
|
||||
# 根据阈值确定标签
|
||||
thresholds = self.config.get('ui', 'thresholds', default={'cold': 30, 'warm': 70})
|
||||
@@ -131,68 +177,161 @@ class BackendWorker(QObject):
|
||||
else:
|
||||
label = "中性"
|
||||
|
||||
self.analysis_finished.emit(avg_score)
|
||||
logger.info(f"情感倾向: {label}")
|
||||
# 发送整数分数
|
||||
self.analysis_finished.emit(int(avg_score))
|
||||
|
||||
def fetch_stock_data(self):
|
||||
"""爬取股票数据并添加到波形图"""
|
||||
try:
|
||||
logger.info("开始爬取股票数据")
|
||||
stock_data = self.spider.fetch_sse_stock_data()
|
||||
|
||||
if stock_data and 'time' in stock_data and 'value' in stock_data:
|
||||
logger.info(f"成功获取股票数据: {stock_data}")
|
||||
# 发送股票数据到主窗口
|
||||
self.stock_data_fetched.emit(stock_data['time'], stock_data['value'])
|
||||
else:
|
||||
logger.warning("未能获取有效的股票数据")
|
||||
|
||||
except Exception as e:
|
||||
logger.error(f"爬取股票数据失败: {str(e)}")
|
||||
|
||||
def manual_refresh(self):
|
||||
"""手动刷新"""
|
||||
logger.info("用户手动刷新")
|
||||
self.no_new_content_count = 0
|
||||
self._run_cycle()
|
||||
if not self.is_running_cycle:
|
||||
self._run_cycle()
|
||||
else:
|
||||
logger.info("上一个周期仍在执行,跳过手动刷新")
|
||||
|
||||
def update_fetch_interval(self, interval: int):
|
||||
"""更新爬取间隔"""
|
||||
logger.info(f"更新爬取间隔: {interval} 秒")
|
||||
self.fetch_interval = interval
|
||||
|
||||
|
||||
def setup_logging(log_path: str, level: str = "INFO"):
|
||||
"""配置日志"""
|
||||
logging.basicConfig(
|
||||
level=getattr(logging, level.upper(), logging.INFO),
|
||||
format='%(asctime)s - %(levelname)s - %(message)s',
|
||||
handlers=[
|
||||
logging.FileHandler(log_path, encoding='utf-8'),
|
||||
logging.StreamHandler()
|
||||
]
|
||||
logger.remove() # 移除默认的处理器
|
||||
|
||||
logger.add(
|
||||
log_path,
|
||||
rotation="10 MB",
|
||||
retention="7 days",
|
||||
level=level,
|
||||
encoding="utf-8",
|
||||
format="{time:YYYY-MM-DD HH:mm:ss} | {level: <8} | {name}:{function}:{line} - {message}"
|
||||
)
|
||||
|
||||
logger.add(
|
||||
sys.stdout,
|
||||
level=level,
|
||||
format="<green>{time:YYYY-MM-DD HH:mm:ss}</green> | <level>{level: <8}</level> | <cyan>{name}</cyan>:<cyan>{function}</cyan>:<cyan>{line}</cyan> - <level>{message}</level>"
|
||||
)
|
||||
|
||||
|
||||
def main():
|
||||
"""主函数"""
|
||||
logger.info("=== 股吧人气指示器启动 ===")
|
||||
|
||||
# 创建应用
|
||||
app = QApplication(sys.argv)
|
||||
app.setQuitOnLastWindowClosed(False) # 允许最小化到托盘
|
||||
|
||||
# 加载配置
|
||||
logger.info("加载配置文件...")
|
||||
config = ConfigManager("config.json")
|
||||
|
||||
# 配置日志
|
||||
log_config = config.logging_config
|
||||
setup_logging(log_config.get('path', 'guba.log'), log_config.get('level', 'INFO'))
|
||||
logger.info(f"日志配置完成: {log_config.get('path', 'guba.log')}, 级别: {log_config.get('level', 'INFO')}")
|
||||
|
||||
# 初始化组件
|
||||
logger.info("初始化数据库...")
|
||||
db = DatabaseManager(config.database_config.get('path', 'guba.db'))
|
||||
|
||||
logger.info("初始化爬虫...")
|
||||
spider = SpiderManager(config.spider_config)
|
||||
|
||||
logger.info("初始化LLM分析器...")
|
||||
analyzer = LLMAnalyzer(config.llm_api_config)
|
||||
|
||||
# 创建后台工作器
|
||||
worker = BackendWorker(config, db, spider, analyzer)
|
||||
worker.update_fetch_interval(config.spider_config.get('fetch_interval', 60))
|
||||
worker.update_fetch_interval(config.spider_config.get('fetch_interval', 15))
|
||||
|
||||
# 创建后台线程
|
||||
logger.info("创建后台线程...")
|
||||
worker_thread = QThread()
|
||||
worker.moveToThread(worker_thread)
|
||||
|
||||
# 线程启动时开始工作
|
||||
worker_thread.started.connect(worker.start)
|
||||
# 线程结束时停止工作
|
||||
worker_thread.finished.connect(worker.stop)
|
||||
|
||||
# 创建主窗口
|
||||
window = MainWindow(config)
|
||||
logger.info("创建主窗口...")
|
||||
window = MainWindow(config, spider)
|
||||
window.show()
|
||||
|
||||
# 连接信号
|
||||
worker.status_update.connect(window.update_status)
|
||||
worker.analysis_finished.connect(window.update_indicator)
|
||||
worker.error_occurred.connect(lambda msg: window.show_message("错误", msg))
|
||||
worker.stock_data_fetched.connect(window.add_waveform_data)
|
||||
|
||||
# 启动时从数据库初始化指示器显示
|
||||
worker._update_indicator()
|
||||
logger.info("初始化指示器显示完成")
|
||||
|
||||
# 设置按钮回调
|
||||
window.set_refresh_callback(worker.manual_refresh)
|
||||
window.set_config_callback(window.show_config)
|
||||
|
||||
# 启动后台任务
|
||||
worker.start()
|
||||
# 启动后台线程
|
||||
worker_thread.start()
|
||||
logger.info("后台线程已启动")
|
||||
|
||||
# 启动股票数据爬取定时器
|
||||
stock_timer = QTimer()
|
||||
stock_timer.timeout.connect(worker.fetch_stock_data)
|
||||
stock_timer.start(60000) # 每分钟爬取一次股票数据
|
||||
logger.info("股票数据爬取定时器已启动,间隔60秒")
|
||||
|
||||
# 确保应用退出时清理线程
|
||||
def cleanup():
|
||||
logger.info("清理资源,停止后台线程...")
|
||||
worker.stop()
|
||||
worker_thread.quit()
|
||||
worker_thread.wait()
|
||||
|
||||
# 显示统计信息
|
||||
logger.info("=== 程序运行统计 ===")
|
||||
logger.info(f"爬取网站次数: {worker.fetch_count}")
|
||||
logger.info(f"提交API分析次数: {worker.analysis_count}")
|
||||
logger.info("=== 统计结束 ===")
|
||||
|
||||
# 写入统计信息到文件
|
||||
try:
|
||||
stats_file = "statistics.txt"
|
||||
with open(stats_file, "a", encoding="utf-8") as f:
|
||||
f.write(f"=== 程序运行统计 - {datetime.now().strftime('%Y-%m-%d %H:%M:%S')} ===\n")
|
||||
f.write(f"爬取网站次数: {worker.fetch_count}\n")
|
||||
f.write(f"提交API分析次数: {worker.analysis_count}\n")
|
||||
f.write("=== 统计结束 ===\n\n")
|
||||
logger.info(f"统计信息已写入到文件: {stats_file}")
|
||||
except Exception as e:
|
||||
logger.error(f"写入统计文件失败: {str(e)}")
|
||||
|
||||
logger.info("后台线程已停止")
|
||||
|
||||
app.aboutToQuit.connect(cleanup)
|
||||
|
||||
logger.info("应用启动完成,进入主循环")
|
||||
# 运行应用
|
||||
sys.exit(app.exec())
|
||||
|
||||
|
||||
Reference in New Issue
Block a user