feat(backend): add batch processing and review tasks modules

- Add Prisma migrations for batch processing tables
- Add Prisma migrations for review tasks tables
- Add seed data for testing
- Add prompt templates for review (editorial, methodology)
- Add CloseAI configuration guide
- Add database validation scripts
This commit is contained in:
2025-11-16 15:43:04 +08:00
parent 0c5310fb77
commit 5579ffa78e
9 changed files with 1611 additions and 0 deletions

View File

@@ -0,0 +1,151 @@
-- AlterTable
ALTER TABLE "documents" ADD COLUMN "char_count" INTEGER,
ADD COLUMN "extracted_text" TEXT,
ADD COLUMN "extraction_method" TEXT,
ADD COLUMN "extraction_quality" DOUBLE PRECISION,
ADD COLUMN "language" TEXT;
-- CreateTable
CREATE TABLE "batch_tasks" (
"id" TEXT NOT NULL,
"user_id" TEXT NOT NULL,
"kb_id" TEXT NOT NULL,
"name" TEXT NOT NULL,
"template_type" TEXT NOT NULL,
"template_id" TEXT,
"prompt" TEXT NOT NULL,
"status" TEXT NOT NULL,
"total_documents" INTEGER NOT NULL,
"completed_count" INTEGER NOT NULL DEFAULT 0,
"failed_count" INTEGER NOT NULL DEFAULT 0,
"model_type" TEXT NOT NULL,
"concurrency" INTEGER NOT NULL DEFAULT 3,
"started_at" TIMESTAMP(3),
"completed_at" TIMESTAMP(3),
"duration_seconds" INTEGER,
"created_at" TIMESTAMP(3) NOT NULL DEFAULT CURRENT_TIMESTAMP,
"updated_at" TIMESTAMP(3) NOT NULL,
CONSTRAINT "batch_tasks_pkey" PRIMARY KEY ("id")
);
-- CreateTable
CREATE TABLE "batch_results" (
"id" TEXT NOT NULL,
"task_id" TEXT NOT NULL,
"document_id" TEXT NOT NULL,
"status" TEXT NOT NULL,
"data" JSONB,
"rawOutput" TEXT,
"error_message" TEXT,
"processing_time_ms" INTEGER,
"tokens_used" INTEGER,
"created_at" TIMESTAMP(3) NOT NULL DEFAULT CURRENT_TIMESTAMP,
CONSTRAINT "batch_results_pkey" PRIMARY KEY ("id")
);
-- CreateTable
CREATE TABLE "task_templates" (
"id" TEXT NOT NULL,
"user_id" TEXT NOT NULL,
"name" TEXT NOT NULL,
"description" TEXT,
"prompt" TEXT NOT NULL,
"outputFields" JSONB NOT NULL,
"is_public" BOOLEAN NOT NULL DEFAULT false,
"created_at" TIMESTAMP(3) NOT NULL DEFAULT CURRENT_TIMESTAMP,
"updated_at" TIMESTAMP(3) NOT NULL,
CONSTRAINT "task_templates_pkey" PRIMARY KEY ("id")
);
-- CreateTable
CREATE TABLE "general_conversations" (
"id" TEXT NOT NULL,
"user_id" TEXT NOT NULL,
"title" TEXT NOT NULL,
"model_name" TEXT,
"created_at" TIMESTAMP(3) NOT NULL DEFAULT CURRENT_TIMESTAMP,
"updated_at" TIMESTAMP(3) NOT NULL DEFAULT CURRENT_TIMESTAMP,
"deleted_at" TIMESTAMP(3),
CONSTRAINT "general_conversations_pkey" PRIMARY KEY ("id")
);
-- CreateTable
CREATE TABLE "general_messages" (
"id" TEXT NOT NULL,
"conversation_id" TEXT NOT NULL,
"role" TEXT NOT NULL,
"content" TEXT NOT NULL,
"model" TEXT,
"metadata" JSONB,
"tokens" INTEGER,
"created_at" TIMESTAMP(3) NOT NULL DEFAULT CURRENT_TIMESTAMP,
CONSTRAINT "general_messages_pkey" PRIMARY KEY ("id")
);
-- CreateIndex
CREATE INDEX "batch_tasks_user_id_idx" ON "batch_tasks"("user_id");
-- CreateIndex
CREATE INDEX "batch_tasks_kb_id_idx" ON "batch_tasks"("kb_id");
-- CreateIndex
CREATE INDEX "batch_tasks_status_idx" ON "batch_tasks"("status");
-- CreateIndex
CREATE INDEX "batch_tasks_created_at_idx" ON "batch_tasks"("created_at");
-- CreateIndex
CREATE INDEX "batch_results_task_id_idx" ON "batch_results"("task_id");
-- CreateIndex
CREATE INDEX "batch_results_document_id_idx" ON "batch_results"("document_id");
-- CreateIndex
CREATE INDEX "batch_results_status_idx" ON "batch_results"("status");
-- CreateIndex
CREATE INDEX "task_templates_user_id_idx" ON "task_templates"("user_id");
-- CreateIndex
CREATE INDEX "general_conversations_user_id_idx" ON "general_conversations"("user_id");
-- CreateIndex
CREATE INDEX "general_conversations_created_at_idx" ON "general_conversations"("created_at");
-- CreateIndex
CREATE INDEX "general_conversations_updated_at_idx" ON "general_conversations"("updated_at");
-- CreateIndex
CREATE INDEX "general_messages_conversation_id_idx" ON "general_messages"("conversation_id");
-- CreateIndex
CREATE INDEX "general_messages_created_at_idx" ON "general_messages"("created_at");
-- CreateIndex
CREATE INDEX "documents_extraction_method_idx" ON "documents"("extraction_method");
-- AddForeignKey
ALTER TABLE "batch_tasks" ADD CONSTRAINT "batch_tasks_user_id_fkey" FOREIGN KEY ("user_id") REFERENCES "users"("id") ON DELETE CASCADE ON UPDATE CASCADE;
-- AddForeignKey
ALTER TABLE "batch_tasks" ADD CONSTRAINT "batch_tasks_kb_id_fkey" FOREIGN KEY ("kb_id") REFERENCES "knowledge_bases"("id") ON DELETE CASCADE ON UPDATE CASCADE;
-- AddForeignKey
ALTER TABLE "batch_results" ADD CONSTRAINT "batch_results_task_id_fkey" FOREIGN KEY ("task_id") REFERENCES "batch_tasks"("id") ON DELETE CASCADE ON UPDATE CASCADE;
-- AddForeignKey
ALTER TABLE "batch_results" ADD CONSTRAINT "batch_results_document_id_fkey" FOREIGN KEY ("document_id") REFERENCES "documents"("id") ON DELETE CASCADE ON UPDATE CASCADE;
-- AddForeignKey
ALTER TABLE "task_templates" ADD CONSTRAINT "task_templates_user_id_fkey" FOREIGN KEY ("user_id") REFERENCES "users"("id") ON DELETE CASCADE ON UPDATE CASCADE;
-- AddForeignKey
ALTER TABLE "general_conversations" ADD CONSTRAINT "general_conversations_user_id_fkey" FOREIGN KEY ("user_id") REFERENCES "users"("id") ON DELETE CASCADE ON UPDATE CASCADE;
-- AddForeignKey
ALTER TABLE "general_messages" ADD CONSTRAINT "general_messages_conversation_id_fkey" FOREIGN KEY ("conversation_id") REFERENCES "general_conversations"("id") ON DELETE CASCADE ON UPDATE CASCADE;

View File

@@ -0,0 +1,35 @@
-- CreateTable
CREATE TABLE "review_tasks" (
"id" TEXT NOT NULL,
"user_id" TEXT NOT NULL,
"file_name" TEXT NOT NULL,
"file_size" INTEGER NOT NULL,
"file_path" TEXT,
"extracted_text" TEXT NOT NULL,
"word_count" INTEGER,
"status" TEXT NOT NULL DEFAULT 'pending',
"editorial_review" JSONB,
"methodology_review" JSONB,
"overall_score" DOUBLE PRECISION,
"model_used" TEXT,
"started_at" TIMESTAMP(3),
"completed_at" TIMESTAMP(3),
"duration_seconds" INTEGER,
"error_message" TEXT,
"created_at" TIMESTAMP(3) NOT NULL DEFAULT CURRENT_TIMESTAMP,
"updated_at" TIMESTAMP(3) NOT NULL,
CONSTRAINT "review_tasks_pkey" PRIMARY KEY ("id")
);
-- CreateIndex
CREATE INDEX "review_tasks_user_id_idx" ON "review_tasks"("user_id");
-- CreateIndex
CREATE INDEX "review_tasks_status_idx" ON "review_tasks"("status");
-- CreateIndex
CREATE INDEX "review_tasks_created_at_idx" ON "review_tasks"("created_at");
-- AddForeignKey
ALTER TABLE "review_tasks" ADD CONSTRAINT "review_tasks_user_id_fkey" FOREIGN KEY ("user_id") REFERENCES "users"("id") ON DELETE CASCADE ON UPDATE CASCADE;

109
backend/prisma/seed.ts Normal file
View File

@@ -0,0 +1,109 @@
/**
* 数据库种子数据脚本
* 用于初始化开发环境的测试用户
*/
import { PrismaClient } from '@prisma/client';
const prisma = new PrismaClient();
async function main() {
console.log('🌱 开始初始化数据库种子数据...');
// 创建测试用户
const mockUser = await prisma.user.upsert({
where: { id: 'user-mock-001' },
update: {},
create: {
id: 'user-mock-001',
email: 'test@example.com',
password: '$2b$12$LQv3c1yqBWVHxkd0LHAkCOYz6TtxMQJqhN8/LewY5GyYIkYvKx7ES', // password: "password123"
name: '测试用户',
role: 'user',
status: 'active',
kbQuota: 3,
kbUsed: 0,
isTrial: true,
trialEndsAt: new Date(Date.now() + 30 * 24 * 60 * 60 * 1000), // 30天后
},
});
console.log('✅ 测试用户创建成功:', {
id: mockUser.id,
email: mockUser.email,
name: mockUser.name,
});
// 可选:创建管理员用户
const adminUser = await prisma.user.upsert({
where: { email: 'admin@example.com' },
update: {},
create: {
id: 'user-admin-001',
email: 'admin@example.com',
password: '$2b$12$LQv3c1yqBWVHxkd0LHAkCOYz6TtxMQJqhN8/LewY5GyYIkYvKx7ES', // password: "password123"
name: '管理员',
role: 'admin',
status: 'active',
kbQuota: 10,
kbUsed: 0,
isTrial: false,
},
});
console.log('✅ 管理员用户创建成功:', {
id: adminUser.id,
email: adminUser.email,
name: adminUser.name,
});
console.log('\n🎉 数据库种子数据初始化完成!\n');
console.log('📝 测试账号信息:');
console.log(' 邮箱: test@example.com');
console.log(' 密码: password123');
console.log(' 用户ID: user-mock-001\n');
console.log('📝 管理员账号信息:');
console.log(' 邮箱: admin@example.com');
console.log(' 密码: password123');
console.log(' 用户ID: user-admin-001\n');
}
main()
.catch((e) => {
console.error('❌ 初始化种子数据失败:', e);
process.exit(1);
})
.finally(async () => {
await prisma.$disconnect();
});