Protokoll #4248

ID4248
Zeitstempel2025-12-22 09:35:09.101303
Clientroot
IP
Warning: Undefined array key "request_ip" in /var/www/dev.campus.systemische-tools.de/src/View/protokoll/show.php on line 13

Deprecated: htmlspecialchars(): Passing null to parameter #1 ($string) of type string is deprecated in /var/www/dev.campus.systemische-tools.de/src/View/protokoll/show.php on line 13
Modellclaude-sonnet-4-20250514
Statuscompleted
Tokens7,439 (Input: 0, Output: 0)
Dauer104 ms
Request-Zeit
Warning: Undefined array key "request_timestamp" in /var/www/dev.campus.systemische-tools.de/src/View/protokoll/show.php on line 18
Response-Zeit-

Warning: Undefined array key "error_message" in /var/www/dev.campus.systemische-tools.de/src/View/protokoll/show.php on line 22

Request

{
    "event": "PreToolUse",
    "tool_name": "Edit",
    "tool_input": {
        "file_path": "\/var\/www\/dev.campus.systemische-tools.de\/src\/Controller\/ContentPipelineController.php",
        "old_string": "    \/**\n     * @return array<string, array<string, mixed>>\n     *\/\n    private function getStepTypes(): array\n    {\n        return [\n            'detect' => [\n                'label' => 'Detect',\n                'icon' => 'search',\n                'description' => 'Scannt Nextcloud nach neuen\/geaenderten Dateien',\n                'configFields' => ['hash_algorithm'],\n            ],\n            'extract' => [\n                'label' => 'Extract',\n                'icon' => 'file-text',\n                'description' => 'Extrahiert Text aus PDF, DOCX, PPTX, MD, TXT',\n                'configFields' => ['ocr_enabled', 'ocr_language'],\n            ],\n            'chunk' => [\n                'label' => 'Chunk',\n                'icon' => 'scissors',\n                'description' => 'Teilt Text in semantische Chunks',\n                'configFields' => ['min_size', 'max_size', 'overlap'],\n            ],\n            'embed' => [\n                'label' => 'Embed',\n                'icon' => 'cpu',\n                'description' => 'Generiert Embeddings via Ollama',\n                'configFields' => ['model', 'collection', 'dimensions'],\n            ],\n            'analyze' => [\n                'label' => 'Analyze',\n                'icon' => 'brain',\n                'description' => 'Extrahiert Entitaeten, Relationen, Taxonomie',\n                'configFields' => ['extract_entities', 'extract_relations', 'classify_taxonomy', 'model'],\n            ],\n        ];\n    }",
        "new_string": "    \/**\n     * @return array<string, array<string, mixed>>\n     *\/\n    private function getStepTypes(): array\n    {\n        return [\n            \/\/ Phase 1: Preprocessing\n            'detect' => [\n                'label' => '1. Detect',\n                'icon' => 'search',\n                'description' => 'Dateien scannen und Format pruefen',\n                'phase' => 'Preprocessing',\n            ],\n            'validate' => [\n                'label' => '2. Validate',\n                'icon' => 'check',\n                'description' => 'Datei-Validierung und Korruptionspruefung',\n                'phase' => 'Preprocessing',\n            ],\n            'extract' => [\n                'label' => '3. Extract',\n                'icon' => 'file-text',\n                'description' => 'Text extrahieren und bereinigen',\n                'phase' => 'Preprocessing',\n            ],\n            'structure' => [\n                'label' => '4. Structure',\n                'icon' => 'list',\n                'description' => 'Ueberschriften und Struktur erkennen',\n                'phase' => 'Preprocessing',\n            ],\n            'segment' => [\n                'label' => '5. Segment',\n                'icon' => 'layout',\n                'description' => 'Logische Dokumentgliederung',\n                'phase' => 'Preprocessing',\n            ],\n            'chunk' => [\n                'label' => '6. Chunk',\n                'icon' => 'scissors',\n                'description' => 'Textbausteine erstellen (max 800 Token)',\n                'phase' => 'Preprocessing',\n            ],\n            \/\/ Phase 2: Embedding & Storage\n            'embed' => [\n                'label' => '7. Embed',\n                'icon' => 'cpu',\n                'description' => 'Vektorisierung mit mxbai-embed-large',\n                'phase' => 'Embedding',\n            ],\n            'collection_setup' => [\n                'label' => '8. Collection',\n                'icon' => 'database',\n                'description' => 'Qdrant-Collection einrichten',\n                'phase' => 'Embedding',\n            ],\n            'vector_store' => [\n                'label' => '9. Store',\n                'icon' => 'upload',\n                'description' => 'Vektoren in Qdrant speichern',\n                'phase' => 'Embedding',\n            ],\n            'metadata_store' => [\n                'label' => '10. Metadata',\n                'icon' => 'tag',\n                'description' => 'Metadaten in MariaDB speichern',\n                'phase' => 'Embedding',\n            ],\n            'index_optimize' => [\n                'label' => '11. Index',\n                'icon' => 'zap',\n                'description' => 'HNSW-Index optimieren',\n                'phase' => 'Embedding',\n            ],\n            \/\/ Phase 3: Analysis\n            'entity_extract' => [\n                'label' => '12. Entities',\n                'icon' => 'users',\n                'description' => 'Entitaeten erkennen (Personen, Konzepte)',\n                'phase' => 'Analysis',\n            ],\n            'relation_extract' => [\n                'label' => '13. Relations',\n                'icon' => 'git-branch',\n                'description' => 'Beziehungen zwischen Entitaeten',\n                'phase' => 'Analysis',\n            ],\n            'taxonomy_build' => [\n                'label' => '14. Taxonomy',\n                'icon' => 'folder-tree',\n                'description' => 'Hierarchische Kategorisierung',\n                'phase' => 'Analysis',\n            ],\n            'semantic_analyze' => [\n                'label' => '15. Semantic',\n                'icon' => 'brain',\n                'description' => 'Bedeutungs-Analyse und Konzepte',\n                'phase' => 'Analysis',\n            ],\n            'summarize' => [\n                'label' => '16. Summary',\n                'icon' => 'file-minus',\n                'description' => 'Dokument-Zusammenfassung',\n                'phase' => 'Analysis',\n            ],\n            'finalize' => [\n                'label' => '17. Finalize',\n                'icon' => 'check-circle',\n                'description' => 'Job abschliessen und Status setzen',\n                'phase' => 'Analysis',\n            ],\n            'question_generate' => [\n                'label' => '18. Questions',\n                'icon' => 'help-circle',\n                'description' => 'Beispielfragen fuer RAG-Chat generieren',\n                'phase' => 'Analysis',\n            ],\n            \/\/ Legacy\n            'analyze' => [\n                'label' => 'Analyze',\n                'icon' => 'brain',\n                'description' => 'Kombinierte Analyse (Legacy)',\n                'phase' => 'Analysis',\n            ],\n        ];\n    }"
    }
}

Response

{
    "tool_response": {
        "filePath": "\/var\/www\/dev.campus.systemische-tools.de\/src\/Controller\/ContentPipelineController.php",
        "oldString": "    \/**\n     * @return array<string, array<string, mixed>>\n     *\/\n    private function getStepTypes(): array\n    {\n        return [\n            'detect' => [\n                'label' => 'Detect',\n                'icon' => 'search',\n                'description' => 'Scannt Nextcloud nach neuen\/geaenderten Dateien',\n                'configFields' => ['hash_algorithm'],\n            ],\n            'extract' => [\n                'label' => 'Extract',\n                'icon' => 'file-text',\n                'description' => 'Extrahiert Text aus PDF, DOCX, PPTX, MD, TXT',\n                'configFields' => ['ocr_enabled', 'ocr_language'],\n            ],\n            'chunk' => [\n                'label' => 'Chunk',\n                'icon' => 'scissors',\n                'description' => 'Teilt Text in semantische Chunks',\n                'configFields' => ['min_size', 'max_size', 'overlap'],\n            ],\n            'embed' => [\n                'label' => 'Embed',\n                'icon' => 'cpu',\n                'description' => 'Generiert Embeddings via Ollama',\n                'configFields' => ['model', 'collection', 'dimensions'],\n            ],\n            'analyze' => [\n                'label' => 'Analyze',\n                'icon' => 'brain',\n                'description' => 'Extrahiert Entitaeten, Relationen, Taxonomie',\n                'configFields' => ['extract_entities', 'extract_relations', 'classify_taxonomy', 'model'],\n            ],\n        ];\n    }",
        "newString": "    \/**\n     * @return array<string, array<string, mixed>>\n     *\/\n    private function getStepTypes(): array\n    {\n        return [\n            \/\/ Phase 1: Preprocessing\n            'detect' => [\n                'label' => '1. Detect',\n                'icon' => 'search',\n                'description' => 'Dateien scannen und Format pruefen',\n                'phase' => 'Preprocessing',\n            ],\n            'validate' => [\n                'label' => '2. Validate',\n                'icon' => 'check',\n                'description' => 'Datei-Validierung und Korruptionspruefung',\n                'phase' => 'Preprocessing',\n            ],\n            'extract' => [\n                'label' => '3. Extract',\n                'icon' => 'file-text',\n                'description' => 'Text extrahieren und bereinigen',\n                'phase' => 'Preprocessing',\n            ],\n            'structure' => [\n                'label' => '4. Structure',\n                'icon' => 'list',\n                'description' => 'Ueberschriften und Struktur erkennen',\n                'phase' => 'Preprocessing',\n            ],\n            'segment' => [\n                'label' => '5. Segment',\n                'icon' => 'layout',\n                'description' => 'Logische Dokumentgliederung',\n                'phase' => 'Preprocessing',\n            ],\n            'chunk' => [\n                'label' => '6. Chunk',\n                'icon' => 'scissors',\n                'description' => 'Textbausteine erstellen (max 800 Token)',\n                'phase' => 'Preprocessing',\n            ],\n            \/\/ Phase 2: Embedding & Storage\n            'embed' => [\n                'label' => '7. Embed',\n                'icon' => 'cpu',\n                'description' => 'Vektorisierung mit mxbai-embed-large',\n                'phase' => 'Embedding',\n            ],\n            'collection_setup' => [\n                'label' => '8. Collection',\n                'icon' => 'database',\n                'description' => 'Qdrant-Collection einrichten',\n                'phase' => 'Embedding',\n            ],\n            'vector_store' => [\n                'label' => '9. Store',\n                'icon' => 'upload',\n                'description' => 'Vektoren in Qdrant speichern',\n                'phase' => 'Embedding',\n            ],\n            'metadata_store' => [\n                'label' => '10. Metadata',\n                'icon' => 'tag',\n                'description' => 'Metadaten in MariaDB speichern',\n                'phase' => 'Embedding',\n            ],\n            'index_optimize' => [\n                'label' => '11. Index',\n                'icon' => 'zap',\n                'description' => 'HNSW-Index optimieren',\n                'phase' => 'Embedding',\n            ],\n            \/\/ Phase 3: Analysis\n            'entity_extract' => [\n                'label' => '12. Entities',\n                'icon' => 'users',\n                'description' => 'Entitaeten erkennen (Personen, Konzepte)',\n                'phase' => 'Analysis',\n            ],\n            'relation_extract' => [\n                'label' => '13. Relations',\n                'icon' => 'git-branch',\n                'description' => 'Beziehungen zwischen Entitaeten',\n                'phase' => 'Analysis',\n            ],\n            'taxonomy_build' => [\n                'label' => '14. Taxonomy',\n                'icon' => 'folder-tree',\n                'description' => 'Hierarchische Kategorisierung',\n                'phase' => 'Analysis',\n            ],\n            'semantic_analyze' => [\n                'label' => '15. Semantic',\n                'icon' => 'brain',\n                'description' => 'Bedeutungs-Analyse und Konzepte',\n                'phase' => 'Analysis',\n            ],\n            'summarize' => [\n                'label' => '16. Summary',\n                'icon' => 'file-minus',\n                'description' => 'Dokument-Zusammenfassung',\n                'phase' => 'Analysis',\n            ],\n            'finalize' => [\n                'label' => '17. Finalize',\n                'icon' => 'check-circle',\n                'description' => 'Job abschliessen und Status setzen',\n                'phase' => 'Analysis',\n            ],\n            'question_generate' => [\n                'label' => '18. Questions',\n                'icon' => 'help-circle',\n                'description' => 'Beispielfragen fuer RAG-Chat generieren',\n                'phase' => 'Analysis',\n            ],\n            \/\/ Legacy\n            'analyze' => [\n                'label' => 'Analyze',\n                'icon' => 'brain',\n                'description' => 'Kombinierte Analyse (Legacy)',\n                'phase' => 'Analysis',\n            ],\n        ];\n    }",
        "originalFile": "<?php\n\nnamespace Controller;\n\nuse Framework\\Controller;\nuse Infrastructure\\Persistence\\PipelineRepository;\n\nclass ContentPipelineController extends Controller\n{\n    private PipelineRepository $repository;\n\n    public function __construct()\n    {\n        $this->repository = new PipelineRepository();\n    }\n\n    \/**\n     * GET \/content-pipeline\n     *\/\n    public function index(): void\n    {\n        $pipelines = $this->repository->findAll();\n        $stats = $this->repository->getStatistics();\n\n        $this->view('content-pipeline.index', [\n            'title' => 'Content Pipeline',\n            'pipelines' => $pipelines,\n            'stats' => $stats,\n        ]);\n    }\n\n    \/**\n     * GET \/content-pipeline\/import\n     *\/\n    public function import(): void\n    {\n        $pipeline = $this->repository->findDefault();\n\n        if ($pipeline === null) {\n            $pipelines = $this->repository->findAll(1);\n            $pipeline = $pipelines[0] ?? null;\n        }\n\n        $latestRun = $pipeline !== null\n            ? $this->repository->findLatestRun((int) $pipeline['id'])\n            : null;\n\n        $this->view('content-pipeline.import', [\n            'title' => 'Import Pipeline',\n            'pipeline' => $pipeline,\n            'latestRun' => $latestRun,\n        ]);\n    }\n\n    \/**\n     * GET \/content-pipeline\/new\n     *\/\n    public function pipelineNew(): void\n    {\n        $this->view('content-pipeline.form', [\n            'title' => 'Neue Pipeline',\n            'pipeline' => null,\n            'stepTypes' => $this->getStepTypes(),\n        ]);\n    }\n\n    \/**\n     * GET \/content-pipeline\/{id}\n     *\/\n    public function show(string $id): void\n    {\n        $pipeline = $this->repository->findById((int) $id);\n\n        if ($pipeline === null) {\n            $this->notFound('Pipeline nicht gefunden');\n        }\n\n        $runs = $this->repository->findRuns((int) $id, 10);\n\n        $this->view('content-pipeline.show', [\n            'title' => 'Pipeline: ' . $pipeline['name'],\n            'pipeline' => $pipeline,\n            'runs' => $runs,\n            'stepTypes' => $this->getStepTypes(),\n        ]);\n    }\n\n    \/**\n     * GET \/content-pipeline\/{id}\/edit\n     *\/\n    public function edit(string $id): void\n    {\n        $pipeline = $this->repository->findById((int) $id);\n\n        if ($pipeline === null) {\n            $this->notFound('Pipeline nicht gefunden');\n        }\n\n        $this->view('content-pipeline.form', [\n            'title' => 'Pipeline bearbeiten: ' . $pipeline['name'],\n            'pipeline' => $pipeline,\n            'stepTypes' => $this->getStepTypes(),\n        ]);\n    }\n\n    \/**\n     * POST \/content-pipeline\n     *\/\n    public function store(): void\n    {\n        $this->requireCsrf();\n\n        $name = trim($_POST['name'] ?? '');\n        $description = trim($_POST['description'] ?? '');\n        $sourcePath = trim($_POST['source_path'] ?? '\/var\/www\/nextcloud\/data\/root\/files\/Documents');\n        $extensions = $this->parseExtensions($_POST['extensions'] ?? '');\n        $isDefault = isset($_POST['is_default']) ? 1 : 0;\n\n        if ($name === '') {\n            $_SESSION['error'] = 'Name ist erforderlich.';\n            header('Location: \/content-pipeline\/new');\n            exit;\n        }\n\n        $pipelineId = $this->repository->create([\n            'name' => $name,\n            'description' => $description,\n            'source_path' => $sourcePath,\n            'extensions' => $extensions,\n            'is_default' => $isDefault,\n        ]);\n\n        \/\/ Standard-Steps hinzufuegen\n        $this->createDefaultSteps($pipelineId);\n\n        $_SESSION['success'] = 'Pipeline erfolgreich erstellt.';\n        header('Location: \/content-pipeline\/' . $pipelineId);\n        exit;\n    }\n\n    \/**\n     * POST \/content-pipeline\/{id}\n     *\/\n    public function update(string $id): void\n    {\n        $this->requireCsrf();\n\n        $pipeline = $this->repository->findById((int) $id);\n\n        if ($pipeline === null) {\n            $this->notFound('Pipeline nicht gefunden');\n        }\n\n        $name = trim($_POST['name'] ?? '');\n        $description = trim($_POST['description'] ?? '');\n        $sourcePath = trim($_POST['source_path'] ?? '');\n        $extensions = $this->parseExtensions($_POST['extensions'] ?? '');\n        $isDefault = isset($_POST['is_default']) ? 1 : 0;\n\n        if ($name === '') {\n            $_SESSION['error'] = 'Name ist erforderlich.';\n            header('Location: \/content-pipeline\/' . $id . '\/edit');\n            exit;\n        }\n\n        $this->repository->update((int) $id, [\n            'name' => $name,\n            'description' => $description,\n            'source_path' => $sourcePath,\n            'extensions' => $extensions,\n            'is_default' => $isDefault,\n        ]);\n\n        $_SESSION['success'] = 'Pipeline aktualisiert.';\n        header('Location: \/content-pipeline\/' . $id);\n        exit;\n    }\n\n    \/**\n     * POST \/content-pipeline\/{id}\/run\n     *\/\n    public function run(string $id): void\n    {\n        $this->requireCsrf();\n\n        $pipeline = $this->repository->findById((int) $id);\n\n        if ($pipeline === null) {\n            $this->notFound('Pipeline nicht gefunden');\n        }\n\n        \/\/ Neuen Run erstellen\n        $runId = $this->repository->createRun((int) $id);\n\n        \/\/ Pipeline im Hintergrund starten\n        $pipelineScript = '\/opt\/scripts\/pipeline\/pipeline.py';\n        $venvPython = '\/opt\/scripts\/pipeline\/venv\/bin\/python';\n        $logFile = '\/tmp\/pipeline_run_' . $runId . '.log';\n\n        $cmd = sprintf(\n            'nohup %s %s all --pipeline-id=%d --run-id=%d > %s 2>&1 &',\n            escapeshellarg($venvPython),\n            escapeshellarg($pipelineScript),\n            (int) $id,\n            $runId,\n            escapeshellarg($logFile)\n        );\n\n        exec($cmd);\n\n        $_SESSION['success'] = 'Pipeline gestartet (Run #' . $runId . ')';\n        header('Location: \/content-pipeline\/' . $id);\n        exit;\n    }\n\n    \/**\n     * GET \/content-pipeline\/{id}\/status\n     * AJAX endpoint for run status\n     *\/\n    public function status(string $id): void\n    {\n        $pipeline = $this->repository->findById((int) $id);\n\n        if ($pipeline === null) {\n            $this->json(['error' => 'Pipeline nicht gefunden'], 404);\n            return;\n        }\n\n        $latestRun = $this->repository->findLatestRun((int) $id);\n\n        $this->json([\n            'pipeline_id' => (int) $id,\n            'run' => $latestRun,\n        ]);\n    }\n\n    \/**\n     * POST \/content-pipeline\/{id}\/steps\/{stepId}\/toggle\n     *\/\n    public function toggleStep(string $id, string $stepId): void\n    {\n        $this->requireCsrf();\n\n        $pipeline = $this->repository->findById((int) $id);\n\n        if ($pipeline === null) {\n            $this->notFound('Pipeline nicht gefunden');\n        }\n\n        \/\/ Find step and toggle\n        foreach ($pipeline['steps'] as $step) {\n            if ((int) $step['id'] === (int) $stepId) {\n                $this->repository->updateStep((int) $stepId, [\n                    'enabled' => $step['enabled'] ? 0 : 1,\n                ]);\n                break;\n            }\n        }\n\n        header('Location: \/content-pipeline\/' . $id);\n        exit;\n    }\n\n    \/**\n     * POST \/content-pipeline\/{id}\/delete\n     *\/\n    public function delete(string $id): void\n    {\n        $this->requireCsrf();\n\n        $pipeline = $this->repository->findById((int) $id);\n\n        if ($pipeline === null) {\n            $this->notFound('Pipeline nicht gefunden');\n        }\n\n        $this->repository->delete((int) $id);\n\n        $_SESSION['success'] = 'Pipeline geloescht.';\n        header('Location: \/content-pipeline');\n        exit;\n    }\n\n    \/**\n     * @return array<string, array<string, mixed>>\n     *\/\n    private function getStepTypes(): array\n    {\n        return [\n            'detect' => [\n                'label' => 'Detect',\n                'icon' => 'search',\n                'description' => 'Scannt Nextcloud nach neuen\/geaenderten Dateien',\n                'configFields' => ['hash_algorithm'],\n            ],\n            'extract' => [\n                'label' => 'Extract',\n                'icon' => 'file-text',\n                'description' => 'Extrahiert Text aus PDF, DOCX, PPTX, MD, TXT',\n                'configFields' => ['ocr_enabled', 'ocr_language'],\n            ],\n            'chunk' => [\n                'label' => 'Chunk',\n                'icon' => 'scissors',\n                'description' => 'Teilt Text in semantische Chunks',\n                'configFields' => ['min_size', 'max_size', 'overlap'],\n            ],\n            'embed' => [\n                'label' => 'Embed',\n                'icon' => 'cpu',\n                'description' => 'Generiert Embeddings via Ollama',\n                'configFields' => ['model', 'collection', 'dimensions'],\n            ],\n            'analyze' => [\n                'label' => 'Analyze',\n                'icon' => 'brain',\n                'description' => 'Extrahiert Entitaeten, Relationen, Taxonomie',\n                'configFields' => ['extract_entities', 'extract_relations', 'classify_taxonomy', 'model'],\n            ],\n        ];\n    }\n\n    \/**\n     * @param string $input\n     * @return array<string>\n     *\/\n    private function parseExtensions(string $input): array\n    {\n        $extensions = [];\n        $parts = preg_split('\/[\\s,;]+\/', $input);\n\n        if ($parts === false) {\n            return ['.pdf', '.docx', '.pptx', '.md', '.txt'];\n        }\n\n        foreach ($parts as $ext) {\n            $ext = trim($ext);\n            if ($ext === '') {\n                continue;\n            }\n            if ($ext[0] !== '.') {\n                $ext = '.' . $ext;\n            }\n            $extensions[] = strtolower($ext);\n        }\n\n        return $extensions !== [] ? $extensions : ['.pdf', '.docx', '.pptx', '.md', '.txt'];\n    }\n\n    private function createDefaultSteps(int $pipelineId): void\n    {\n        $defaultSteps = [\n            ['step_type' => 'detect', 'config... [TRUNCATED-20081e070684db8e]",
        "structuredPatch": [
            {
                "oldStart": 287,
                "oldLines": 35,
                "newStart": 287,
                "newLines": 123,
                "lines": [
                    "     private function getStepTypes(): array",
                    "     {",
                    "         return [",
                    "+            \/\/ Phase 1: Preprocessing",
                    "             'detect' => [",
                    "-                'label' => 'Detect',",
                    "+                'label' => '1. Detect',",
                    "                 'icon' => 'search',",
                    "-                'description' => 'Scannt Nextcloud nach neuen\/geaenderten Dateien',",
                    "-                'configFields' => ['hash_algorithm'],",
                    "+                'description' => 'Dateien scannen und Format pruefen',",
                    "+                'phase' => 'Preprocessing',",
                    "             ],",
                    "+            'validate' => [",
                    "+                'label' => '2. Validate',",
                    "+                'icon' => 'check',",
                    "+                'description' => 'Datei-Validierung und Korruptionspruefung',",
                    "+                'phase' => 'Preprocessing',",
                    "+            ],",
                    "             'extract' => [",
                    "-                'label' => 'Extract',",
                    "+                'label' => '3. Extract',",
                    "                 'icon' => 'file-text',",
                    "-                'description' => 'Extrahiert Text aus PDF, DOCX, PPTX, MD, TXT',",
                    "-                'configFields' => ['ocr_enabled', 'ocr_language'],",
                    "+                'description' => 'Text extrahieren und bereinigen',",
                    "+                'phase' => 'Preprocessing',",
                    "             ],",
                    "+            'structure' => [",
                    "+                'label' => '4. Structure',",
                    "+                'icon' => 'list',",
                    "+                'description' => 'Ueberschriften und Struktur erkennen',",
                    "+                'phase' => 'Preprocessing',",
                    "+            ],",
                    "+            'segment' => [",
                    "+                'label' => '5. Segment',",
                    "+                'icon' => 'layout',",
                    "+                'description' => 'Logische Dokumentgliederung',",
                    "+                'phase' => 'Preprocessing',",
                    "+            ],",
                    "             'chunk' => [",
                    "-                'label' => 'Chunk',",
                    "+                'label' => '6. Chunk',",
                    "                 'icon' => 'scissors',",
                    "-                'description' => 'Teilt Text in semantische Chunks',",
                    "-                'configFields' => ['min_size', 'max_size', 'overlap'],",
                    "+                'description' => 'Textbausteine erstellen (max 800 Token)',",
                    "+                'phase' => 'Preprocessing',",
                    "             ],",
                    "+            \/\/ Phase 2: Embedding & Storage",
                    "             'embed' => [",
                    "-                'label' => 'Embed',",
                    "+                'label' => '7. Embed',",
                    "                 'icon' => 'cpu',",
                    "-                'description' => 'Generiert Embeddings via Ollama',",
                    "-                'configFields' => ['model', 'collection', 'dimensions'],",
                    "+                'description' => 'Vektorisierung mit mxbai-embed-large',",
                    "+                'phase' => 'Embedding',",
                    "             ],",
                    "+            'collection_setup' => [",
                    "+                'label' => '8. Collection',",
                    "+                'icon' => 'database',",
                    "+                'description' => 'Qdrant-Collection einrichten',",
                    "+                'phase' => 'Embedding',",
                    "+            ],",
                    "+            'vector_store' => [",
                    "+                'label' => '9. Store',",
                    "+                'icon' => 'upload',",
                    "+                'description' => 'Vektoren in Qdrant speichern',",
                    "+                'phase' => 'Embedding',",
                    "+            ],",
                    "+            'metadata_store' => [",
                    "+                'label' => '10. Metadata',",
                    "+                'icon' => 'tag',",
                    "+                'description' => 'Metadaten in MariaDB speichern',",
                    "+                'phase' => 'Embedding',",
                    "+            ],",
                    "+            'index_optimize' => [",
                    "+                'label' => '11. Index',",
                    "+                'icon' => 'zap',",
                    "+                'description' => 'HNSW-Index optimieren',",
                    "+                'phase' => 'Embedding',",
                    "+            ],",
                    "+            \/\/ Phase 3: Analysis",
                    "+            'entity_extract' => [",
                    "+                'label' => '12. Entities',",
                    "+                'icon' => 'users',",
                    "+                'description' => 'Entitaeten erkennen (Personen, Konzepte)',",
                    "+                'phase' => 'Analysis',",
                    "+            ],",
                    "+            'relation_extract' => [",
                    "+                'label' => '13. Relations',",
                    "+                'icon' => 'git-branch',",
                    "+                'description' => 'Beziehungen zwischen Entitaeten',",
                    "+                'phase' => 'Analysis',",
                    "+            ],",
                    "+            'taxonomy_build' => [",
                    "+                'label' => '14. Taxonomy',",
                    "+                'icon' => 'folder-tree',",
                    "+                'description' => 'Hierarchische Kategorisierung',",
                    "+                'phase' => 'Analysis',",
                    "+            ],",
                    "+            'semantic_analyze' => [",
                    "+                'label' => '15. Semantic',",
                    "+                'icon' => 'brain',",
                    "+                'description' => 'Bedeutungs-Analyse und Konzepte',",
                    "+                'phase' => 'Analysis',",
                    "+            ],",
                    "+            'summarize' => [",
                    "+                'label' => '16. Summary',",
                    "+                'icon' => 'file-minus',",
                    "+                'description' => 'Dokument-Zusammenfassung',",
                    "+                'phase' => 'Analysis',",
                    "+            ],",
                    "+            'finalize' => [",
                    "+                'label' => '17. Finalize',",
                    "+                'icon' => 'check-circle',",
                    "+                'description' => 'Job abschliessen und Status setzen',",
                    "+                'phase' => 'Analysis',",
                    "+            ],",
                    "+            'question_generate' => [",
                    "+                'label' => '18. Questions',",
                    "+                'icon' => 'help-circle',",
                    "+                'description' => 'Beispielfragen fuer RAG-Chat generieren',",
                    "+                'phase' => 'Analysis',",
                    "+            ],",
                    "+            \/\/ Legacy",
                    "             'analyze' => [",
                    "                 'label' => 'Analyze',",
                    "                 'icon' => 'brain',",
                    "-                'description' => 'Extrahiert Entitaeten, Relationen, Taxonomie',",
                    "-                'configFields' => ['extract_entities', 'extract_relations', 'classify_taxonomy', 'model'],",
                    "+                'description' => 'Kombinierte Analyse (Legacy)',",
                    "+                'phase' => 'Analysis',",
                    "             ],",
                    "         ];",
                    "     }"
                ]
            }
        ],
        "userModified": false,
        "replaceAll": false
    }
}
← Vorheriger Zur Liste Nächster →