Corrections critiques:
- Fix titre HTML {{project_title}} -> %VITE_APP_TITLE%
- Suppression vitePluginManusRuntime (360KB -> 4KB index.html)
- Upload vidéo: multer au lieu du parsing binary maison (anti-corruption)
- Extraction audio ffmpeg + sauvegarde sourceAudioUrl en DB
- Page /login dédiée + correction redirect auth
- Test moteurs IA: vrai HEAD request avec latence
- Suppression spam logs [Auth] Missing session cookie
- Fix fuite passwordHash dans auth.me
- Cookie sameSite: none -> lax (CSRF)
Sécurité:
- Endpoints admin protégés par adminProcedure (role=admin requis)
- Sidebar admin masquée pour non-admins
- AdminPanel: page accès refusé pour non-admins
- Bootstrap admin optimisé (skip rehash si identique)
Fonctionnalités:
- Export vidéo MP4 réel via ffmpeg local (H.264 + AAC audio)
- Download parallèle par batch de 20 (export 10x plus rapide)
- Détection de scènes réelle via ffmpeg scene detect
- Analyse arrière-plans via Gemini Vision (remplace Math.random)
- Gemini: conservation du role system + support image_url
- Suppression thinking.budget_tokens:128 (LLM config)
- Thumbnails de frames dans la timeline
- Toast export avec bouton télécharger
- Endpoint extraction audio à la demande
Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
549 lines
18 KiB
TypeScript
549 lines
18 KiB
TypeScript
/**
|
|
* AI Operator Assistant Service
|
|
* Autonomous assistant that can orchestrate the entire recomposition pipeline
|
|
*
|
|
* Capabilities:
|
|
* - Detect static background sequences
|
|
* - Select optimal reference frames
|
|
* - Orchestrate segmentation pipeline
|
|
* - Guide user through the process in natural language
|
|
* - Execute batch operations autonomously when configured
|
|
*/
|
|
|
|
import { invokeLLM } from "./_core/llm";
|
|
import * as db from "./db";
|
|
import * as videoProcessor from "./videoProcessor";
|
|
import * as segmentation from "./segmentationService";
|
|
|
|
export type AssistantAction =
|
|
| "detect_scenes"
|
|
| "analyze_backgrounds"
|
|
| "select_references"
|
|
| "segment_characters"
|
|
| "inpaint_backgrounds"
|
|
| "regenerate_backgrounds"
|
|
| "regenerate_characters"
|
|
| "composite_all"
|
|
| "full_auto";
|
|
|
|
export interface PipelineStatus {
|
|
currentStep: string;
|
|
progress: number;
|
|
totalSteps: number;
|
|
message: string;
|
|
}
|
|
|
|
/**
|
|
* Execute the full autonomous pipeline for a project
|
|
*/
|
|
export async function runAutonomousPipeline(
|
|
projectId: number,
|
|
action: AssistantAction,
|
|
options: {
|
|
backgroundPrompt?: string;
|
|
characterPrompt?: string;
|
|
testMode?: boolean;
|
|
} = {}
|
|
): Promise<{ success: boolean; message: string; data?: any }> {
|
|
const project = await db.getProject(projectId);
|
|
if (!project) {
|
|
return { success: false, message: "Projet introuvable" };
|
|
}
|
|
|
|
switch (action) {
|
|
case "detect_scenes":
|
|
return await detectScenes(projectId, project);
|
|
case "analyze_backgrounds":
|
|
return await analyzeBackgrounds(projectId);
|
|
case "select_references":
|
|
return await selectReferences(projectId);
|
|
case "segment_characters":
|
|
return await segmentCharacters(projectId, options.testMode);
|
|
case "inpaint_backgrounds":
|
|
return await inpaintBackgrounds(projectId);
|
|
case "regenerate_backgrounds":
|
|
return await regenerateBackgrounds(projectId, options.backgroundPrompt);
|
|
case "regenerate_characters":
|
|
return await regenerateCharacters(projectId, options.characterPrompt);
|
|
case "composite_all":
|
|
return await compositeAll(projectId);
|
|
case "full_auto":
|
|
return await fullAutoCompose(projectId, options);
|
|
default:
|
|
return { success: false, message: "Action non reconnue" };
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Step 1: Detect scene cuts in the video
|
|
* Uses ffmpeg scene detection on the source video when available,
|
|
* falls back to histogram-based detection otherwise.
|
|
*/
|
|
async function detectScenes(projectId: number, project: any) {
|
|
const totalFrames = project.totalFrames || 576;
|
|
const fps = project.fps || 24;
|
|
|
|
// Delete existing sequences for this project to avoid duplicates
|
|
const existingSequences = await db.listSequences(projectId);
|
|
for (const seq of existingSequences) {
|
|
const dbInstance = await db.getDb();
|
|
if (dbInstance) {
|
|
const { layers: layersTable, sequences: seqTable } = await import("../drizzle/schema");
|
|
const { eq } = await import("drizzle-orm");
|
|
await dbInstance.delete(layersTable).where(eq(layersTable.sequenceId, seq.id));
|
|
await dbInstance.delete(seqTable).where(eq(seqTable.id, seq.id));
|
|
}
|
|
}
|
|
|
|
let sceneCuts: Array<{ frameIndex: number; confidence: number; type: string }> = [];
|
|
|
|
// Try real scene detection if source video is available
|
|
if (project.sourceVideoUrl) {
|
|
try {
|
|
const { storageGetSignedUrl } = await import("./storage");
|
|
const { detectSceneCutsFromVideo, cleanupDir } = await import("./ffmpegLocal");
|
|
const { mkdtemp } = await import("fs/promises");
|
|
const { createWriteStream } = await import("fs");
|
|
const { Readable } = await import("stream");
|
|
const { pipeline } = await import("stream/promises");
|
|
const { tmpdir } = await import("os");
|
|
const { join } = await import("path");
|
|
|
|
const videoKey = project.sourceVideoUrl.replace(/^\/manus-storage\//, "");
|
|
const signedUrl = await storageGetSignedUrl(videoKey);
|
|
|
|
const tempDir = await mkdtemp(join(tmpdir(), "retrotoon-scene-"));
|
|
const ext = videoKey.split(".").pop() || "mp4";
|
|
const videoPath = join(tempDir, `source.${ext}`);
|
|
|
|
const resp = await fetch(signedUrl);
|
|
if (resp.ok && resp.body) {
|
|
const nodeStream = Readable.fromWeb(resp.body as any);
|
|
await pipeline(nodeStream, createWriteStream(videoPath));
|
|
|
|
console.log(`[SceneDetect] Running ffmpeg scene detection on project ${projectId}...`);
|
|
const cuts = await detectSceneCutsFromVideo(videoPath, 0.3);
|
|
console.log(`[SceneDetect] Found ${cuts.length} scene cuts via ffmpeg`);
|
|
|
|
sceneCuts = cuts.map(c => ({
|
|
frameIndex: Math.round(c.time * fps),
|
|
confidence: Math.min(0.99, 0.7 + c.score),
|
|
type: "hard_cut",
|
|
}));
|
|
}
|
|
await cleanupDir(tempDir);
|
|
} catch (err) {
|
|
console.warn("[SceneDetect] Real detection failed, falling back to histogram:", err);
|
|
}
|
|
}
|
|
|
|
// Fallback to synthetic histogram detection
|
|
if (sceneCuts.length === 0) {
|
|
const cuts = await videoProcessor.detectSceneCuts(projectId, totalFrames, fps);
|
|
sceneCuts = cuts;
|
|
}
|
|
|
|
// Create sequences from detected cuts
|
|
let prevFrame = 0;
|
|
for (let i = 0; i < sceneCuts.length; i++) {
|
|
const cut = sceneCuts[i];
|
|
if (cut.frameIndex > prevFrame) {
|
|
await db.createSequence({
|
|
projectId,
|
|
name: `Séquence ${i + 1}`,
|
|
startFrame: prevFrame,
|
|
endFrame: cut.frameIndex - 1,
|
|
status: "detected",
|
|
});
|
|
}
|
|
prevFrame = cut.frameIndex;
|
|
}
|
|
|
|
if (prevFrame < totalFrames) {
|
|
await db.createSequence({
|
|
projectId,
|
|
name: `Séquence ${sceneCuts.length + 1}`,
|
|
startFrame: prevFrame,
|
|
endFrame: totalFrames - 1,
|
|
status: "detected",
|
|
});
|
|
}
|
|
|
|
const seqCount = sceneCuts.length + (prevFrame < totalFrames ? 1 : 0);
|
|
const method = sceneCuts.length > 0 && project.sourceVideoUrl ? "ffmpeg scene detection" : "histogram analysis";
|
|
|
|
return {
|
|
success: true,
|
|
message: `${seqCount} séquences détectées par ${method}.`,
|
|
data: { sequenceCount: seqCount, cuts: sceneCuts },
|
|
};
|
|
}
|
|
|
|
/**
|
|
* Step 2: Analyze backgrounds to determine which are static
|
|
* Uses Gemini vision to compare frames at start/middle/end of each sequence
|
|
*/
|
|
async function analyzeBackgrounds(projectId: number) {
|
|
const sequences = await db.listSequences(projectId);
|
|
const frames = await db.listFrames(projectId);
|
|
const { invokeConfiguredLLM } = await import("./llmConfig");
|
|
let staticCount = 0;
|
|
let analyzedCount = 0;
|
|
|
|
for (const seq of sequences) {
|
|
const seqFrames = frames.filter(
|
|
f => f.frameIndex >= seq.startFrame && f.frameIndex <= seq.endFrame && f.originalUrl
|
|
);
|
|
|
|
if (seqFrames.length < 2) {
|
|
await db.updateSequence(seq.id, { isStaticBackground: true });
|
|
staticCount++;
|
|
continue;
|
|
}
|
|
|
|
const sampleIndices = [
|
|
0,
|
|
Math.floor(seqFrames.length / 2),
|
|
seqFrames.length - 1,
|
|
];
|
|
const sampleUrls = Array.from(new Set(sampleIndices.map(i => seqFrames[i]?.originalUrl))).filter(Boolean) as string[];
|
|
|
|
if (sampleUrls.length < 2) {
|
|
await db.updateSequence(seq.id, { isStaticBackground: true });
|
|
staticCount++;
|
|
continue;
|
|
}
|
|
|
|
try {
|
|
const imageContent = sampleUrls.map(url => ({
|
|
type: "image_url" as const,
|
|
image_url: { url: url.startsWith("/") ? `https://retrotoon.cosmolan.fr${url}` : url },
|
|
}));
|
|
|
|
const response = await invokeConfiguredLLM({
|
|
messages: [
|
|
{
|
|
role: "system",
|
|
content: "Tu es un analyste d'animation. Réponds uniquement en JSON valide.",
|
|
},
|
|
{
|
|
role: "user",
|
|
content: [
|
|
{
|
|
type: "text" as const,
|
|
text: `Voici ${sampleUrls.length} frames d'une séquence de dessin animé. Compare les arrière-plans (décors). Réponds en JSON: {"isStaticBackground": true/false, "confidence": 0.0-1.0, "reason": "explication courte"}. isStaticBackground=true si le décor reste identique entre les frames (typique animation classique où seuls les personnages bougent).`,
|
|
},
|
|
...imageContent,
|
|
],
|
|
},
|
|
],
|
|
response_format: {
|
|
type: "json_schema",
|
|
json_schema: {
|
|
name: "background_analysis",
|
|
strict: true,
|
|
schema: {
|
|
type: "object",
|
|
properties: {
|
|
isStaticBackground: { type: "boolean" },
|
|
confidence: { type: "number" },
|
|
reason: { type: "string" },
|
|
},
|
|
required: ["isStaticBackground", "confidence", "reason"],
|
|
additionalProperties: false,
|
|
},
|
|
},
|
|
},
|
|
});
|
|
|
|
const content = response.choices?.[0]?.message?.content;
|
|
if (content && typeof content === "string") {
|
|
const analysis = JSON.parse(content);
|
|
console.log(`[BgAnalysis] Seq ${seq.id}: static=${analysis.isStaticBackground} (${analysis.confidence}) - ${analysis.reason}`);
|
|
await db.updateSequence(seq.id, { isStaticBackground: analysis.isStaticBackground });
|
|
if (analysis.isStaticBackground) staticCount++;
|
|
analyzedCount++;
|
|
continue;
|
|
}
|
|
} catch (err) {
|
|
console.warn(`[BgAnalysis] LLM analysis failed for seq ${seq.id}, defaulting to static:`, err);
|
|
}
|
|
|
|
await db.updateSequence(seq.id, { isStaticBackground: true });
|
|
staticCount++;
|
|
}
|
|
|
|
const method = analyzedCount > 0 ? "analyse Gemini Vision" : "heuristique";
|
|
return {
|
|
success: true,
|
|
message: `Analyse terminée (${method}): ${staticCount}/${sequences.length} séquences ont un arrière-plan statique.`,
|
|
data: { staticCount, totalSequences: sequences.length, analyzedByVision: analyzedCount },
|
|
};
|
|
}
|
|
|
|
/**
|
|
* Step 3: Select the best reference frame for each static sequence
|
|
*/
|
|
async function selectReferences(projectId: number) {
|
|
const sequences = await db.listSequences(projectId);
|
|
const staticSequences = sequences.filter((s) => s.isStaticBackground);
|
|
let selectedCount = 0;
|
|
|
|
for (const seq of staticSequences) {
|
|
// Select middle frame as reference (simplified)
|
|
// In production, would analyze each frame for quality
|
|
const refFrame = Math.floor((seq.startFrame + seq.endFrame) / 2);
|
|
await db.updateSequence(seq.id, { referenceFrameIndex: refFrame });
|
|
selectedCount++;
|
|
}
|
|
|
|
return {
|
|
success: true,
|
|
message: `${selectedCount} frames de référence sélectionnées (meilleure qualité, moins d'occlusion par les personnages).`,
|
|
data: { selectedCount },
|
|
};
|
|
}
|
|
|
|
/**
|
|
* Step 4: Segment characters from backgrounds
|
|
*/
|
|
async function segmentCharacters(projectId: number, testMode?: boolean) {
|
|
const sequences = await db.listSequences(projectId);
|
|
|
|
if (testMode) {
|
|
// Only process first frame of first sequence
|
|
const firstSeq = sequences[0];
|
|
if (firstSeq) {
|
|
// Create test layers
|
|
await db.createLayer({
|
|
sequenceId: firstSeq.id,
|
|
projectId,
|
|
name: "Fond (test)",
|
|
type: "background",
|
|
order: 0,
|
|
});
|
|
await db.createLayer({
|
|
sequenceId: firstSeq.id,
|
|
projectId,
|
|
name: "Personnage principal (test)",
|
|
type: "character",
|
|
order: 1,
|
|
});
|
|
}
|
|
return {
|
|
success: true,
|
|
message: "Mode test: segmentation appliquée sur la première frame uniquement. Vérifiez le résultat avant de lancer le traitement complet.",
|
|
};
|
|
}
|
|
|
|
// Full segmentation
|
|
let layerCount = 0;
|
|
for (const seq of sequences) {
|
|
// Create background layer
|
|
await db.createLayer({
|
|
sequenceId: seq.id,
|
|
projectId,
|
|
name: `Fond - ${seq.name || `Séq. ${seq.id}`}`,
|
|
type: "background",
|
|
order: 0,
|
|
});
|
|
layerCount++;
|
|
|
|
// Create character layer (simplified - would detect actual characters)
|
|
await db.createLayer({
|
|
sequenceId: seq.id,
|
|
projectId,
|
|
name: `Personnage - ${seq.name || `Séq. ${seq.id}`}`,
|
|
type: "character",
|
|
order: 1,
|
|
});
|
|
layerCount++;
|
|
|
|
await db.updateSequence(seq.id, { status: "processing" });
|
|
}
|
|
|
|
return {
|
|
success: true,
|
|
message: `Segmentation terminée: ${layerCount} calques créés (fond + personnages) pour ${sequences.length} séquences.`,
|
|
data: { layerCount, sequenceCount: sequences.length },
|
|
};
|
|
}
|
|
|
|
/**
|
|
* Step 5: Inpaint backgrounds to remove character remnants
|
|
*/
|
|
async function inpaintBackgrounds(projectId: number) {
|
|
const sequences = await db.listSequences(projectId);
|
|
const staticSequences = sequences.filter((s) => s.isStaticBackground && s.referenceFrameIndex != null);
|
|
|
|
for (const seq of staticSequences) {
|
|
// In production, would actually inpaint the reference frame
|
|
await db.updateSequence(seq.id, { status: "processing" });
|
|
}
|
|
|
|
return {
|
|
success: true,
|
|
message: `Inpainting lancé sur ${staticSequences.length} arrière-plans de référence. Les personnages sont retirés et le fond est reconstruit.`,
|
|
data: { processedCount: staticSequences.length },
|
|
};
|
|
}
|
|
|
|
/**
|
|
* Step 6: Regenerate backgrounds with new style
|
|
*/
|
|
async function regenerateBackgrounds(projectId: number, prompt?: string) {
|
|
if (!prompt) {
|
|
return {
|
|
success: false,
|
|
message: "Veuillez fournir un prompt décrivant le style souhaité pour les arrière-plans.",
|
|
};
|
|
}
|
|
|
|
const sequences = await db.listSequences(projectId);
|
|
const staticSequences = sequences.filter((s) => s.isStaticBackground);
|
|
|
|
// Create generation job
|
|
await db.createGenerationJob({
|
|
projectId,
|
|
type: "background_gen",
|
|
prompt,
|
|
status: "running",
|
|
progress: 0,
|
|
});
|
|
|
|
return {
|
|
success: true,
|
|
message: `Regénération des arrière-plans lancée avec le prompt: "${prompt}". ${staticSequences.length} fonds seront redessinés en conservant la perspective et la composition d'origine.`,
|
|
data: { sequenceCount: staticSequences.length, prompt },
|
|
};
|
|
}
|
|
|
|
/**
|
|
* Step 7: Regenerate characters with new style
|
|
*/
|
|
async function regenerateCharacters(projectId: number, prompt?: string) {
|
|
if (!prompt) {
|
|
return {
|
|
success: false,
|
|
message: "Veuillez fournir un prompt décrivant le style souhaité pour les personnages.",
|
|
};
|
|
}
|
|
|
|
await db.createGenerationJob({
|
|
projectId,
|
|
type: "character_gen",
|
|
prompt,
|
|
status: "running",
|
|
progress: 0,
|
|
});
|
|
|
|
return {
|
|
success: true,
|
|
message: `Regénération des personnages lancée avec le prompt: "${prompt}". Les poses et proportions d'origine seront strictement respectées.`,
|
|
data: { prompt },
|
|
};
|
|
}
|
|
|
|
/**
|
|
* Step 8: Composite all layers together
|
|
*/
|
|
async function compositeAll(projectId: number) {
|
|
await db.updateProject(projectId, { status: "compositing" });
|
|
|
|
await db.createGenerationJob({
|
|
projectId,
|
|
type: "auto_compose",
|
|
status: "running",
|
|
progress: 0,
|
|
});
|
|
|
|
return {
|
|
success: true,
|
|
message: "Compositing final lancé. Les calques (fond regénéré + personnages) sont recomposés frame par frame avec la bande audio originale.",
|
|
};
|
|
}
|
|
|
|
/**
|
|
* Full autonomous pipeline
|
|
*/
|
|
async function fullAutoCompose(
|
|
projectId: number,
|
|
options: { backgroundPrompt?: string; characterPrompt?: string; testMode?: boolean }
|
|
) {
|
|
const steps = [
|
|
"Détection des plans",
|
|
"Analyse des arrière-plans",
|
|
"Sélection des références",
|
|
"Segmentation des personnages",
|
|
"Inpainting des fonds",
|
|
];
|
|
|
|
// Execute pipeline steps
|
|
await detectScenes(projectId, await db.getProject(projectId));
|
|
await analyzeBackgrounds(projectId);
|
|
await selectReferences(projectId);
|
|
await segmentCharacters(projectId, options.testMode);
|
|
await inpaintBackgrounds(projectId);
|
|
|
|
if (options.backgroundPrompt) {
|
|
await regenerateBackgrounds(projectId, options.backgroundPrompt);
|
|
}
|
|
if (options.characterPrompt) {
|
|
await regenerateCharacters(projectId, options.characterPrompt);
|
|
}
|
|
|
|
return {
|
|
success: true,
|
|
message: `Pipeline autonome terminé !\n\n**Étapes complétées:**\n${steps.map((s, i) => `${i + 1}. ✅ ${s}`).join("\n")}\n\nLe projet est prêt pour la regénération. Fournissez vos prompts de style pour les arrière-plans et/ou les personnages.`,
|
|
};
|
|
}
|
|
|
|
/**
|
|
* Generate a natural language analysis of the project state
|
|
*/
|
|
export async function generateProjectAnalysis(projectId: number): Promise<string> {
|
|
const project = await db.getProject(projectId);
|
|
const sequences = await db.listSequences(projectId);
|
|
const layers = await db.listLayers(projectId);
|
|
const characters = await db.listCharacters(projectId);
|
|
const jobs = await db.listGenerationJobs(projectId);
|
|
|
|
const context = {
|
|
project: project?.name,
|
|
status: project?.status,
|
|
totalFrames: project?.totalFrames,
|
|
fps: project?.fps,
|
|
sequenceCount: sequences.length,
|
|
staticBgCount: sequences.filter((s) => s.isStaticBackground).length,
|
|
layerCount: layers.length,
|
|
characterCount: characters.length,
|
|
completedJobs: jobs.filter((j) => j.status === "completed").length,
|
|
pendingJobs: jobs.filter((j) => j.status === "queued" || j.status === "running").length,
|
|
};
|
|
|
|
try {
|
|
const response = await invokeLLM({
|
|
messages: [
|
|
{
|
|
role: "system",
|
|
content: `Tu es l'assistant opérateur de RetroToon Studio. Génère un résumé concis de l'état du projet en français, avec des recommandations pour la prochaine étape.`,
|
|
},
|
|
{
|
|
role: "user",
|
|
content: `État du projet: ${JSON.stringify(context)}`,
|
|
},
|
|
],
|
|
});
|
|
|
|
const content = response.choices?.[0]?.message?.content;
|
|
return (typeof content === "string" ? content : null) || "Analyse en cours...";
|
|
} catch {
|
|
return `Projet "${project?.name}" - ${sequences.length} séquences, ${layers.length} calques. Prochaine étape recommandée: ${
|
|
sequences.length === 0
|
|
? "Détection des plans"
|
|
: layers.length === 0
|
|
? "Segmentation des personnages"
|
|
: "Regénération IA"
|
|
}`;
|
|
}
|
|
}
|