feat: 初始化项目结构并添加核心功能模块

- 新增文档模板和导航结构
- 实现服务器基础API路由和控制器
- 添加扩展插件配置和前端框架
- 引入多租户和权限管理模块
- 集成日志和数据库配置
- 添加核心业务模型和类型定义
This commit is contained in:
2026-03-17 22:07:19 +08:00
parent c0870dce50
commit 136c2fa579
728 changed files with 107690 additions and 5614 deletions

View File

@@ -0,0 +1,115 @@
import { Job } from 'bullmq';
import { WorkerHub } from './WorkerHub';
import { CrawlerService } from '../services/CrawlerService';
import { AIService } from '../services/AIService';
import { FingerprintEngine } from '../core/ai/FingerprintEngine';
import { ProductService } from '../services/ProductService';
import { AuditService } from '../services/AuditService';
import { logger } from '../utils/logger';
/**
 * [CORE_WORK_01] Crawler Worker
 * @description Asynchronously crawls a product page, runs multi-modal
 * optimization on it, generates a composite fingerprint and persists the
 * product as a draft. Every run writes an audit record carrying the trace
 * context supplied with the job.
 */
export class CrawlerWorker {
  /** Name of the queue this worker consumes from and `submit` publishes to. */
  private static readonly QUEUE_NAME = 'crawler-tasks';

  /**
   * Registers the job processor for the crawler queue on the WorkerHub.
   *
   * The processor resolves with `{ id, url, status: 'completed' }` once the
   * product has been persisted, and rethrows the original pipeline error on
   * failure so the queue can apply its retry policy.
   */
  static init() {
    WorkerHub.registerWorker(CrawlerWorker.QUEUE_NAME, async (job: Job) => {
      const { url, sandbox, traceContext } = job.data;
      // A job submitted without traceContext must not crash before the
      // try/catch below gets a chance to log and audit it.
      const { tenantId, shopId, taskId, traceId, userId } = traceContext ?? {};
      logger.info(`[CrawlerWorker] Starting task ${job.id} for URL: ${url}`);
      try {
        // 1. Crawl
        const productData = await CrawlerService.crawlProduct(url, { useSandbox: sandbox });

        // 2. Multi-modal optimization
        const optimized = await AIService.analyzeMultiModalProduct({
          title: productData.title || '',
          description: productData.description,
          attributes: productData.attributes || {},
          imageUrls: productData.images || []
        });
        productData.title = optimized.optimizedTitle;
        productData.description = optimized.optimizedDescription;
        productData.attributes = { ...productData.attributes, ...optimized.validatedAttributes };

        // 3. Fingerprint generation (computed from the optimized text)
        const fingerprint = await FingerprintEngine.generateCompositeFingerprint({
          title: productData.title,
          description: productData.description,
          mainImage: productData.mainImage || ''
        });

        // 4. Persist
        const id = await ProductService.create({
          ...productData,
          phash: fingerprint.phash,
          semanticHash: fingerprint.semanticHash,
          vectorEmbedding: JSON.stringify(fingerprint.vectorEmbedding),
          status: 'draft'
        });

        // 5. Audit log. Best-effort: the product is already stored, so an
        // audit failure must not fail the job and trigger a retry that would
        // insert the same product again.
        await CrawlerWorker.auditBestEffort(job.id, () =>
          AuditService.log({
            tenantId,
            shopId,
            taskId,
            traceId,
            userId,
            module: 'SYNC',
            action: 'CRAWLER_ASYNC_COMPLETE',
            resourceType: 'product',
            resourceId: String(id),
            afterSnapshot: { url, id },
            result: 'success',
            source: 'node'
          })
        );

        return { id, url, status: 'completed' };
      } catch (err: unknown) {
        // Anything can be thrown; only Error instances carry a message.
        const message = err instanceof Error ? err.message : String(err);
        logger.error(`[CrawlerWorker] Task ${job.id} failed: ${message}`);

        // Failure audit. Best-effort so that an audit outage never replaces
        // the real pipeline error that is rethrown below.
        await CrawlerWorker.auditBestEffort(job.id, () =>
          AuditService.log({
            tenantId,
            shopId,
            taskId,
            traceId,
            userId,
            module: 'SYNC',
            action: 'CRAWLER_ASYNC_FAILED',
            resourceType: 'product',
            resourceId: url,
            result: 'failed',
            errorCode: 'CRAWLER_WORKER_ERROR',
            errorMessage: message,
            source: 'node'
          })
        );

        throw err;
      }
    }, 10); // concurrency limited to 10
  }

  /**
   * Submits a crawl task to the queue.
   *
   * @param data Job payload: the URL to crawl, an optional sandbox flag and
   * the trace context that is copied into the audit records.
   * @returns Whatever the queue's `add` resolves with.
   */
  static async submit(data: {
    url: string;
    sandbox?: boolean;
    traceContext: any;
  }) {
    const queue = WorkerHub.getQueue(CrawlerWorker.QUEUE_NAME);
    return await queue.add(`crawl-${Date.now()}`, data, {
      attempts: 3,
      backoff: { type: 'exponential', delay: 1000 }
    });
  }

  /**
   * Runs an audit write and logs, rather than propagates, any failure.
   *
   * @param jobId Id of the job being audited, used only in the log message.
   * @param write Thunk performing the actual audit call.
   */
  private static async auditBestEffort(
    jobId: string | undefined,
    write: () => Promise<unknown>
  ): Promise<void> {
    try {
      await write();
    } catch (auditErr: unknown) {
      const reason = auditErr instanceof Error ? auditErr.message : String(auditErr);
      logger.error(`[CrawlerWorker] Audit log for task ${jobId} failed: ${reason}`);
    }
  }
}