后端重构: - 新增分层架构:API Routes -> Services -> Repositories -> Infrastructure - 彻底移除全局单例,全面采用 FastAPI 依赖注入 - 新增 api/ 目录拆分路由(proxies, plugins, scheduler, settings, stats) - 新增 services/ 业务逻辑层:ProxyService, PluginService, SchedulerService, ValidatorService, SettingsService - 新增 repositories/ 数据访问层:ProxyRepository, SettingsRepository, PluginSettingsRepository - 新增 models/ 层:Pydantic Schemas + Domain Models - 重写 core/config.py:采用 Pydantic Settings 管理配置 - 新增 core/db.py:基于 asynccontextmanager 的连接管理,支持数据库迁移 - 新增 core/exceptions.py:统一业务异常体系 插件系统重构(核心): - 新增 core/plugin_system/:BaseCrawlerPlugin + PluginRegistry - 采用显式注册模式(装饰器 + plugins/__init__.py),类型安全、测试友好 - 新增 plugins/base.py:BaseHTTPPlugin 通用 HTTP 爬虫基类 - 迁移全部 7 个插件到新架构(fate0, proxylist_download, ip3366, ip89, kuaidaili, speedx, yundaili) - 插件状态持久化到 plugin_settings 表 任务调度重构: - 新增 core/tasks/queue.py:ValidationQueue + WorkerPool - 解耦爬取与验证:爬虫只负责爬取,代理提交队列后由 Worker 异步验证 - 调度器定时从数据库拉取存量代理并分批投入验证队列 前端调整: - 新增 frontend/src/services/ 层拆分 API 调用逻辑 - 调整 stores/ 和 views/ 使用 Service 层 - 保持 API 兼容性,页面无需大幅修改 其他: - 新增 main.py 作为新入口 - 新增 DESIGN.md 架构设计文档 - 更新 requirements.txt 增加 pydantic-settings
78 lines
3.1 KiB
Python
78 lines
3.1 KiB
Python
"""插件注册中心 - 显式注册,类型安全,测试友好"""
|
||
import importlib
|
||
import inspect
|
||
import os
|
||
from typing import Dict, List, Type, Optional
|
||
from core.plugin_system.base import BaseCrawlerPlugin
|
||
from core.log import logger
|
||
|
||
|
||
class PluginRegistry:
|
||
"""插件注册中心"""
|
||
|
||
def __init__(self):
|
||
self._plugins: Dict[str, Type[BaseCrawlerPlugin]] = {}
|
||
self._instances: Dict[str, BaseCrawlerPlugin] = {}
|
||
|
||
def register(self, plugin_cls: Type[BaseCrawlerPlugin]) -> Type[BaseCrawlerPlugin]:
|
||
"""注册一个插件类。支持装饰器语法。"""
|
||
if not inspect.isclass(plugin_cls) or not issubclass(plugin_cls, BaseCrawlerPlugin):
|
||
raise ValueError("Plugin must be a subclass of BaseCrawlerPlugin")
|
||
if not plugin_cls.name:
|
||
raise ValueError(f"Plugin {plugin_cls.__name__} must have a 'name' attribute")
|
||
|
||
self._plugins[plugin_cls.name] = plugin_cls
|
||
logger.info(f"Plugin registered: {plugin_cls.name} ({plugin_cls.__name__})")
|
||
return plugin_cls
|
||
|
||
def get(self, name: str) -> Optional[BaseCrawlerPlugin]:
|
||
"""获取插件实例(懒加载)"""
|
||
if name not in self._instances:
|
||
cls = self._plugins.get(name)
|
||
if cls:
|
||
self._instances[name] = cls()
|
||
return self._instances.get(name)
|
||
|
||
def list_plugins(self) -> List[BaseCrawlerPlugin]:
|
||
"""获取所有已注册插件的实例列表"""
|
||
result = []
|
||
for name in self._plugins:
|
||
instance = self.get(name)
|
||
if instance:
|
||
result.append(instance)
|
||
return result
|
||
|
||
def get_plugin_names(self) -> List[str]:
|
||
return list(self._plugins.keys())
|
||
|
||
def auto_discover(self, package_name: str):
|
||
"""自动扫描指定包下的所有模块并注册其中的插件类。
|
||
注意:为了类型安全和可控性,推荐显式注册。auto_discover 仅作为兼容。"""
|
||
try:
|
||
package = importlib.import_module(package_name)
|
||
package_dir = os.path.dirname(package.__file__)
|
||
except Exception as e:
|
||
logger.error(f"Auto discover failed for package {package_name}: {e}")
|
||
return
|
||
|
||
for filename in os.listdir(package_dir):
|
||
if filename.endswith(".py") and not filename.startswith("__"):
|
||
module_name = f"{package_name}.{filename[:-3]}"
|
||
try:
|
||
module = importlib.import_module(module_name)
|
||
for attr_name in dir(module):
|
||
obj = getattr(module, attr_name)
|
||
if (
|
||
inspect.isclass(obj)
|
||
and issubclass(obj, BaseCrawlerPlugin)
|
||
and obj is not BaseCrawlerPlugin
|
||
and obj not in self._plugins.values()
|
||
):
|
||
self.register(obj)
|
||
except Exception as e:
|
||
logger.error(f"Failed to load module {module_name}: {e}")
|
||
|
||
|
||
# 全局注册中心实例
|
||
registry = PluginRegistry()
|