__init__.py

Code Hygiene Score: 100

Keine Issues gefunden.

Code

"""
KI-System Document Pipeline

A Python-based document processing pipeline for:
- Text extraction from PDF, PPTX, DOCX, MD, TXT
- Semantic chunking with hierarchy preservation
- Embedding generation via Ollama (mxbai-embed-large)
- Vector storage in Qdrant
- Semantic analysis (entities, relations, taxonomy)

Usage:
    from pipeline import pipeline
    pipeline.main()

Or from command line:
    python -m pipeline scan
    python -m pipeline process
    python -m pipeline all
"""

__version__ = "1.0.0"
← Übersicht