Initial commit: Python MCP server (Streamable HTTP, API key, return documents)

2026-06-13 06:02:13 +00:00
commit 269f3b9757
7 changed files with 1855 additions and 0 deletions
@@ -0,0 +1,70 @@
 # Dockerfile for py-docx-mcp (Python MCP server) - OpenWebUI: MCP (Streamable HTTP)
 # Usage:
 #   docker build -t py-docx-mcp .
 #   docker run --rm -p 3000:3000 py-docx-mcp
 #
 # In OpenWebUI:
 #   - Type: MCP (Streamable HTTP)
 #   - URL: http://<host>:3000
 #   - Auth: Bearer (if DOCX_MCP_API_KEY is set)
 #
 # Environment:
 #   DOCX_MCP_API_KEY            - API key (Bearer or X-API-Key). Optional but recommended.
 #   DOCX_MCP_HTTP_HOST          - Bind host (default: 0.0.0.0)
 #   DOCX_MCP_HTTP_PORT          - Bind port (default: 3000)
 #   DOCX_MCP_TEMPLATES_DIR      - Templates directory (default: /templates)
 #   DOCX_MCP_MAX_SIZE           - Max document size in bytes (default: 104857600)
 #   DOCX_MCP_MAX_DOCS           - Max open documents (default: 30)
 #   DOCX_MCP_SANDBOX            - Enable sandbox mode (default: true)
 #   DOCX_MCP_ALLOW_EXTERNAL_TOOLS - Allow external tools (default: false; this image sets it to true)
 #   DOCX_MCP_ALLOW_NETWORK      - Allow network access (default: false)
 FROM python:3.12-slim AS base
 ENV PYTHONDONTWRITEBYTECODE=1 \
    PYTHONUNBUFFERED=1 \
    PIP_NO_CACHE_DIR=off \
    PIP_DISABLE_PIP_VERSION_CHECK=1
 WORKDIR /app
 # System deps (for python-docx, Pillow, and optional external converters)
 RUN apt-get update && apt-get install -y --no-install-recommends \
    build-essential \
    libjpeg62-turbo-dev \
    libpng-dev \
    libfreetype6-dev \
    libfontconfig1-dev \
    libreoffice \
    poppler-utils \
    && rm -rf /var/lib/apt/lists/*
 # Copy project metadata and sources. The sources must be in place before
 # `pip install .`: the wheel is built from src/py_docx (see pyproject.toml),
 # so installing first would leave py_docx out of site-packages.
 COPY pyproject.toml ./
 COPY src/py_docx ./src/py_docx
 # Install the package and its Python dependencies
 RUN pip install --upgrade pip && pip install .
 # Create runtime dirs
 RUN mkdir -p /templates /out /tmp/py-docx-mcp
 # Environment
 ENV DOCX_MCP_HTTP_HOST=0.0.0.0 \
    DOCX_MCP_HTTP_PORT=3000 \
    DOCX_MCP_TEMPLATES_DIR=/templates \
    DOCX_MCP_MAX_SIZE=104857600 \
    DOCX_MCP_MAX_DOCS=30 \
    DOCX_MCP_SANDBOX=true \
    DOCX_MCP_ALLOW_EXTERNAL_TOOLS=true \
    DOCX_MCP_ALLOW_NETWORK=false
 # Expose HTTP port (Streamable HTTP for OpenWebUI)
 EXPOSE 3000
 # Health check (ensure module is importable)
 HEALTHCHECK --interval=30s --timeout=5s --start-period=5s --retries=3 \
    CMD python -c "import py_docx.server; print('ok')" || exit 1
 # Default: Streamable HTTP for OpenWebUI MCP
 ENTRYPOINT ["python", "-m", "py_docx.server"]
@@ -0,0 +1,24 @@
 [build-system]
 requires = ["hatchling"]
 build-backend = "hatchling.build"
 [project]
 name = "py-docx-mcp"
 version = "0.1.0"
 description = "Python MCP server for DOCX document manipulation"
 requires-python = ">=3.10"
 dependencies = [
    "mcp>=1.0.0",
    "python-docx>=1.1.0",
    "Pillow>=10.0.0",
    "markdown>=3.5",
    "html5lib>=1.1",
    "regex>=2024.0.0",
    "aiofiles>=24.0.0",
 ]
 [project.scripts]
 py-docx-mcp = "py_docx.server:main"
 [tool.hatch.build.targets.wheel]
 packages = ["src/py_docx"]
@@ -0,0 +1 @@
 # py-docx-mcp: Python MCP server for DOCX document manipulation
@@ -0,0 +1,933 @@
 from __future__ import annotations
 import base64
 import json
 import os
 import re
 import tempfile
 import uuid
 from dataclasses import dataclass, field
 from typing import Any, Dict, List, Optional, Union
 import regex as re_lib
 from docx import Document
 from docx.shared import Inches, Pt, RGBColor
 from docx.enum.text import WD_ALIGN_PARAGRAPH
 from PIL import Image as PILImage
 from io import BytesIO
 from py_docx.security import SecurityConfig
 def file_to_result(path: str, return_content: bool = False) -> Any:
    """Describe a file on disk as a plain result dictionary.

    Args:
        path: Location of the file to describe.
        return_content: When true, the file bytes are included base64-encoded.

    Returns:
        ``{"path", "size"}``, plus ``"content_base64"`` when content was
        requested. With content, ``size`` is the number of bytes read.
    """
    stat_size = os.path.getsize(path)
    if return_content:
        with open(path, "rb") as handle:
            payload = handle.read()
        return {
            "path": path,
            "size": len(payload),
            "content_base64": base64.b64encode(payload).decode("utf-8"),
        }
    return {"path": path, "size": stat_size}
@dataclass
 class DocumentMetadata:
    """Summary record for one registered document, as built by ``get_metadata``."""
    document_id: str  # registry key of the document
    path: str  # filesystem path recorded for the document
    name: str  # display name stored in the registry entry
    size: int  # size in bytes of the file at ``path``
    pages: int  # rough estimate (one page per 40 paragraphs, minimum 1), not a rendered page count
 class DocxToolsProvider:
    def __init__(
        self,
        security_config: SecurityConfig,
        templates_dir: str,
    ):
        """Set up an empty document registry and a private temp directory.

        Args:
            security_config: Mode flags and limits; reported by ``get_security_info``.
            templates_dir: Directory searched by ``generate_from_template``.
        """
        self.security_config = security_config
        self.templates_dir = templates_dir
        # Maps document id -> {"doc": <docx document>, "path": str, "name": str}.
        self.documents: Dict[str, Any] = {}
        # mkdtemp creates the directory immediately; no method of this class removes it.
        self._temp_base = tempfile.mkdtemp(prefix="py_docx_mcp_")
    # ---- basic lifecycle ----
    def create_document(self) -> str:
        """Create a blank document, write it to the temp area and register it.

        Returns:
            The UUID string under which the new document is registered.
        """
        new_id = str(uuid.uuid4())
        target = os.path.join(self._temp_base, f"{new_id}.docx")
        blank = Document()
        # Written right away so the registered path exists on disk.
        blank.save(target)
        self.documents[new_id] = dict(doc=blank, path=target, name="Untitled")
        return new_id
    def open_document(self, path: str) -> str:
        if not os.path.isfile(path):
            raise ValueError(f"File not found: {path}")
        doc_id = str(uuid.uuid4())
        doc = Document(path)
        self.documents[doc_id] = {
            "doc": doc,
            "path": path,
            "name": os.path.basename(path),
        }
        return doc_id
    def get_doc(self, document_id: str) -> Document:
        entry = self.documents.get(document_id)
        if not entry:
            raise ValueError(f"Document not found: {document_id}")
        return entry["doc"]
    def list_documents(self) -> List[Dict[str, Any]]:
        out = []
        for doc_id, info in self.documents.items():
            out.append({
                "document_id": doc_id,
                "name": info["name"],
                "path": info["path"],
            })
        return out
    def close_document(self, document_id: str) -> None:
        if document_id not in self.documents:
            raise ValueError("Document not found")
        del self.documents[document_id]
    # ---- content operations ----
    def add_paragraph(
        self,
        document_id: str,
        text: str,
        style: Dict[str, Any],
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        p = doc.add_paragraph(text)
        run = p.runs[0] if p.runs else p.add_run()
        font_family = style.get("font_family")
        font_size = style.get("font_size")
        bold = style.get("bold")
        italic = style.get("italic")
        underline = style.get("underline")
        color = style.get("color")
        alignment = style.get("alignment")
        if font_family:
            run.font.name = font_family
        if font_size:
            run.font.size = Pt(font_size)
        if bold is not None:
            run.bold = bool(bold)
        if italic is not None:
            run.italic = bool(italic)
        if underline is not None:
            run.underline = bool(underline)
        if color:
            try:
                run.font.color.rgb = RGBColor.from_string(color)
            except Exception:
                pass
        if alignment:
            align = alignment.lower()
            if align == "center":
                p.alignment = WD_ALIGN_PARAGRAPH.CENTER
            elif align == "right":
                p.alignment = WD_ALIGN_PARAGRAPH.RIGHT
            elif align == "justify":
                p.alignment = WD_ALIGN_PARAGRAPH.JUSTIFY
        return self._maybe_return_doc(document_id, return_content)
    def add_heading(
        self,
        document_id: str,
        text: str,
        level: int,
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        level = max(0, min(6, level))
        doc.add_heading(text, level=level)
        return self._maybe_return_doc(document_id, return_content)
    def add_table(
        self,
        document_id: str,
        rows: List[List[str]],
        headers: Optional[List[str]] = None,
        border_style: Optional[str] = None,
        col_widths: Optional[List[int]] = None,
        cell_shading: Optional[str] = None,
        merges: Optional[List[Dict[str, int]]] = None,
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        rows = rows or []
        if headers:
            rows = [headers] + rows
        if not rows:
            return self._maybe_return_doc(document_id, return_content)
        table = doc.add_table(rows=len(rows), cols=len(rows[0]))
        for ri, row in enumerate(rows):
            for ci, val in enumerate(row):
                table.cell(ri, ci).text = str(val or "")
        if merges:
            for m in merges:
                r = m.get("row", 0)
                c = m.get("col", 0)
                row_span = m.get("row_span", 1)
                col_span = m.get("col_span", 1)
                if row_span > 1 or col_span > 1:
                    table.cell(r, c).merge(
                        table.cell(r + row_span - 1, c + col_span - 1)
                    )
        return self._maybe_return_doc(document_id, return_content)
    def add_section_break(
        self,
        document_id: str,
        page_size: Optional[str] = None,
        orientation: Optional[str] = None,
        margins: Optional[Dict[str, float]] = None,
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        doc.add_page_break()
        return self._maybe_return_doc(document_id, return_content)
    def add_list(
        self,
        document_id: str,
        items: List[str],
        ordered: bool,
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        prefix = "1. " if ordered else "- "
        for item in items:
            doc.add_paragraph(f"{prefix}{item}")
        return self._maybe_return_doc(document_id, return_content)
    def add_list_item(
        self,
        document_id: str,
        text: str,
        level: int,
        ordered: bool,
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        indent = "  " * level
        prefix = "1. " if ordered else "- "
        doc.add_paragraph(f"{indent}{prefix}{text}")
        return self._maybe_return_doc(document_id, return_content)
    def add_page_break(
        self,
        document_id: str,
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        doc.add_page_break()
        return self._maybe_return_doc(document_id, return_content)
    def insert_toc(
        self,
        document_id: str,
        from_level: int = 1,
        to_level: int = 3,
        right_align_dots: bool = True,
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        doc.add_paragraph("Table of Contents (placeholder)")
        return self._maybe_return_doc(document_id, return_content)
    def insert_bookmark_after_heading(
        self,
        document_id: str,
        heading_text: str,
        name: str,
        return_content: bool = False,
    ) -> Any:
        """Placeholder: no bookmark is inserted.

        ``heading_text`` and ``name`` are ignored; the call only returns the
        result of ``_maybe_return_doc`` for the document.
        """
        # python-docx does not expose bookmarks easily; placeholder.
        return self._maybe_return_doc(document_id, return_content)
    def set_header(
        self,
        document_id: str,
        text: str,
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        section = doc.sections[0]
        header = section.header
        header.paragraphs[0].text = text
        return self._maybe_return_doc(document_id, return_content)
    def set_footer(
        self,
        document_id: str,
        text: str,
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        section = doc.sections[0]
        footer = section.footer
        footer.paragraphs[0].text = text
        return self._maybe_return_doc(document_id, return_content)
    def set_page_numbering(
        self,
        document_id: str,
        location: str,
        template: Optional[str] = None,
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        section = doc.sections[0]
        target = section.footer if location == "footer" else section.header
        target.paragraphs[0].text = template or "Page {PAGE} of {PAGES}"
        return self._maybe_return_doc(document_id, return_content)
    def embed_page_number_fields(
        self,
        document_id: str,
        return_content: bool = False,
    ) -> Any:
        """Placeholder: the document is not modified.

        Only returns the result of ``_maybe_return_doc`` for the document.
        """
        # python-docx cannot easily inject raw field codes; no-op placeholder.
        return self._maybe_return_doc(document_id, return_content)
    def add_image(
        self,
        document_id: str,
        data_base64: str,
        width: Optional[int] = None,
        height: Optional[int] = None,
        alt_text: Optional[str] = None,
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        img_data = base64.b64decode(data_base64)
        img = PILImage.open(BytesIO(img_data))
        tmp_path = "/tmp/py_docx_temp.png"
        img.save(tmp_path, format="PNG")
        doc.add_picture(
            tmp_path,
            width=Inches(width / 96.0) if width else None,
            height=Inches(height / 96.0) if height else None,
        )
        return self._maybe_return_doc(document_id, return_content)
    def add_hyperlink(
        self,
        document_id: str,
        text: str,
        url: str,
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        doc.add_paragraph(f"{text} ({url})")
        return self._maybe_return_doc(document_id, return_content)
    def find_and_replace(
        self,
        document_id: str,
        find_text: str,
        replace_text: str,
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        count = 0
        for para in doc.paragraphs:
            if find_text in para.text:
                para.text = para.text.replace(find_text, replace_text)
                count += para.text.count(replace_text)
        return {
            "success": True,
            "replacements": count,
            "document": self._maybe_return_doc(document_id, return_content),
        }
    def find_and_replace_advanced(
        self,
        document_id: str,
        pattern: str,
        replacement: str,
        case_sensitive: bool,
        whole_word: bool,
        use_regex: bool,
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        count = 0
        for para in doc.paragraphs:
            original = para.text
            if use_regex:
                flags = 0 if case_sensitive else re_lib.IGNORECASE
                pat = pattern
            else:
                if whole_word:
                    pat = r"\b" + re_lib.escape(pattern) + r"\b"
                else:
                    pat = re_lib.escape(pattern)
                flags = 0 if case_sensitive else re_lib.IGNORECASE
            new_text, n = re_lib.subn(pat, replacement, original, flags=flags)
            if new_text != original:
                para.text = new_text
                count += n
        return {
            "success": True,
            "replacements": count,
            "document": self._maybe_return_doc(document_id, return_content),
        }
    def apply_paragraph_format(
        self,
        document_id: str,
        contains: Optional[str],
        format: Dict[str, Any],
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        updated = 0
        for para in doc.paragraphs:
            if contains and (contains not in para.text):
                continue
            for run in para.runs or []:
                if "font_family" in format:
                    run.font.name = format["font_family"]
                if "font_size" in format:
                    run.font.size = Pt(int(format["font_size"]))
                if "bold" in format:
                    run.bold = bool(format["bold"])
                if "italic" in format:
                    run.italic = bool(format["italic"])
                if "underline" in format:
                    run.underline = bool(format["underline"])
                if "color" in format:
                    try:
                        run.font.color.rgb = RGBColor.from_string(format["color"])
                    except Exception:
                        pass
            updated += 1
        return {
            "success": True,
            "paragraphs_updated": updated,
            "document": self._maybe_return_doc(document_id, return_content),
        }
    def extract_text(self, document_id: str) -> str:
        doc = self.get_doc(document_id)
        return "\n".join(p.text for p in doc.paragraphs)
    def get_tables(self, document_id: str) -> List[Dict[str, Any]]:
        doc = self.get_doc(document_id)
        out = []
        for idx, table in enumerate(doc.tables):
            rows_data = []
            for row in table.rows:
                cells = [cell.text for cell in row.cells]
                rows_data.append(cells)
            out.append({
                "index": idx,
                "rows": len(table.rows),
                "cols": len(table.columns),
                "data": rows_data,
            })
        return out
    def list_images(self, document_id: str) -> List[Dict[str, Any]]:
        """Placeholder: always returns an empty list.

        The document is not looked up, so an unknown id does not raise.
        """
        return []
    def list_hyperlinks(self, document_id: str) -> List[Dict[str, Any]]:
        doc = self.get_doc(document_id)
        links = []
        for p in doc.paragraphs:
            for m in re.finditer(r"\((https?://\S+)\)", p.text):
                links.append({"text": p.text.strip(), "url": m.group(1)})
        return links
    def get_fields_summary(self, document_id: str) -> Dict[str, Any]:
        """Placeholder: returns a fixed note; the document is not inspected."""
        return {"note": "Fields summary not fully implemented in Python version"}
    def strip_personal_info(self, document_id: str) -> None:
        doc = self.get_doc(document_id)
        core = doc.core_properties
        core.author = ""
        core.last_modified_by = ""
        core.revision_number = 1
    def get_metadata(self, document_id: str) -> DocumentMetadata:
        info = self.documents[document_id]
        path = info["path"]
        size = os.path.getsize(path)
        doc = info["doc"]
        pages = max(1, len(doc.paragraphs) // 40)
        return DocumentMetadata(
            document_id=document_id,
            path=path,
            name=info["name"],
            size=size,
            pages=pages,
        )
    def save_document(
        self,
        document_id: str,
        output_path: str,
        return_content: bool = True,
    ) -> Any:
        info = self.documents[document_id]
        os.makedirs(os.path.dirname(output_path) or ".", exist_ok=True)
        info["doc"].save(output_path)
        return file_to_result(output_path, return_content=return_content)
    # ---- conversion (best-effort, external tools optional) ----
    def convert_to_pdf(
        self,
        document_id: str,
        output_path: str,
        prefer_external: bool = False,
        return_content: bool = True,
    ) -> Any:
        meta = self.get_metadata(document_id)
        # If external tools are allowed, you can call LibreOffice here;
        # for now, we indicate requirement.
        if prefer_external:
            raise NotImplementedError(
                "External PDF conversion not yet wired; "
                "configure LibreOffice/unoconv integration."
            )
        raise NotImplementedError(
            "PDF conversion not yet implemented in pure Python version."
        )
    def export_pdf_with_field_refresh(
        self,
        document_id: str,
        output_path: str,
        prefer_external: bool = True,
        return_content: bool = True,
    ) -> Any:
        self.embed_page_number_fields(document_id)
        return self.convert_to_pdf(document_id, output_path, prefer_external, return_content=return_content)
    def convert_to_images(
        self,
        document_id: str,
        output_dir: str,
        format: str = "png",
        dpi: int = 150,
        return_content: bool = True,
    ) -> Any:
        """Not implemented: always raises, without looking at any argument.

        Raises:
            NotImplementedError: Always.
        """
        raise NotImplementedError(
            "Image conversion not yet implemented in pure Python version."
        )
    def convert_to_images_with_preference(
        self,
        document_id: str,
        output_dir: str,
        format: str = "png",
        dpi: int = 150,
        prefer_external: bool = True,
        return_content: bool = True,
    ) -> Any:
        return self.convert_to_images(document_id, output_dir, format, dpi, return_content=return_content)
    # ---- advanced docx operations ----
    def merge_documents(
        self,
        document_ids: List[str],
        output_path: str,
        return_content: bool = True,
    ) -> Any:
        merged = Document()
        for did in document_ids:
            doc = self.get_doc(did)
            for elem in doc.element.body:
                merged.element.body.append(elem)
        os.makedirs(os.path.dirname(output_path) or ".", exist_ok=True)
        merged.save(output_path)
        return file_to_result(output_path, return_content=return_content)
    def split_document(
        self,
        document_id: str,
        output_dir: str,
        return_content: bool = True,
    ) -> Any:
        # Very naive: split by page breaks.
        doc = self.get_doc(document_id)
        os.makedirs(output_dir, exist_ok=True)
        parts: List[Document] = []
        current = Document()
        for elem in doc.element.body:
            tag = elem.tag
            if "lastRenderedPageBreak" in tag or "pageBreakBefore" in tag:
                parts.append(current)
                current = Document()
            else:
                current.element.body.append(elem)
        if len(current.element.body) > 0:
            parts.append(current)
        results = []
        for i, pdoc in enumerate(parts):
            path = os.path.join(output_dir, f"part_{i}.docx")
            pdoc.save(path)
            results.append(file_to_result(path, return_content=return_content))
        return {"parts": results}
    def get_document_structure(self, document_id: str) -> Dict[str, Any]:
        doc = self.get_doc(document_id)
        headings = []
        for p in doc.paragraphs:
            if p.style.name.startswith("Heading"):
                headings.append({
                    "text": p.text,
                    "style": p.style.name,
                })
        return {
            "headings": headings,
            "paragraph_count": len(doc.paragraphs),
            "table_count": len(doc.tables),
        }
    def get_outline(self, document_id: str) -> List[Dict[str, Any]]:
        return self.get_document_structure(document_id).get("headings", [])
    def get_ranges(self, document_id: str, selector: str) -> List[Dict[str, Any]]:
        # Minimal: "heading:'Text'" or "paragraph[i]"
        doc = self.get_doc(document_id)
        ranges = []
        if selector.startswith("heading:"):
            target = selector[len("heading:"):].strip().strip("'\"")
            for i, p in enumerate(doc.paragraphs):
                if p.style.name.startswith("Heading") and target.lower() in p.text.lower():
                    ranges.append({"type": "paragraph", "index": i})
        elif selector.startswith("paragraph["):
            m = re.match(r"paragraph\[(\d+)\]", selector)
            if m:
                idx = int(m.group(1))
                ranges.append({"type": "paragraph", "index": idx})
        return ranges
    def replace_range_text(
        self,
        document_id: str,
        range_id: Dict[str, Any],
        text: str,
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        if range_id.get("type") == "paragraph":
            idx = range_id.get("index")
            if 0 <= idx < len(doc.paragraphs):
                doc.paragraphs[idx].text = text
        return self._maybe_return_doc(document_id, return_content)
    def set_table_cell_text(
        self,
        document_id: str,
        table_index: int,
        row: int,
        col: int,
        text: str,
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        table = doc.tables[table_index]
        table.cell(row, col).text = text
        return self._maybe_return_doc(document_id, return_content)
    def get_document_properties(self, document_id: str) -> Dict[str, Any]:
        doc = self.get_doc(document_id)
        core = doc.core_properties
        return {
            "title": core.title,
            "subject": core.subject,
            "author": core.author,
            "last_modified_by": core.last_modified_by,
            "created": str(core.created),
            "modified": str(core.modified),
        }
    def set_document_properties(
        self,
        document_id: str,
        title: Optional[str],
        subject: Optional[str],
        author: Optional[str],
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        core = doc.core_properties
        if title is not None:
            core.title = title
        if subject is not None:
            core.subject = subject
        if author is not None:
            core.author = author
        return self._maybe_return_doc(document_id, return_content)
    def insert_after_heading(
        self,
        document_id: str,
        heading_text: str,
        text: str,
        return_content: bool = False,
    ) -> Any:
        doc = self.get_doc(document_id)
        for p in doc.paragraphs:
            if p.style.name.startswith("Heading") and heading_text.lower() in p.text.lower():
                doc.add_paragraph(text)
                return self._maybe_return_doc(document_id, return_content)
        return {"success": False, "reason": "Heading not found"}
    def sanitize_external_links(self, document_id: str) -> None:
        # naive: remove URLs from text
        doc = self.get_doc(document_id)
        for p in doc.paragraphs:
            p.text = re.sub(r"(https?://\S+)", "", p.text)
    def redact_text(
        self,
        document_id: str,
        pattern: str,
        use_regex: bool = False,
        whole_word: bool = False,
        case_sensitive: bool = False,
        return_content: bool = False,
    ) -> Any:
        result = self.find_and_replace_advanced(
            document_id,
            pattern=pattern,
            replacement="█",
            case_sensitive=case_sensitive,
            whole_word=whole_word,
            use_regex=use_regex,
            return_content=return_content,
        )
        return result
    def analyze_formatting(self, document_id: str) -> Dict[str, Any]:
        doc = self.get_doc(document_id)
        styles = set()
        fonts = set()
        for p in doc.paragraphs:
            styles.add(p.style.name)
            for run in p.runs or []:
                if run.font.name:
                    fonts.add(run.font.name)
        return {
            "styles_used": list(styles),
            "fonts_detected": list(fonts),
            "has_tables": len(doc.tables) > 0,
            "has_images": False,
            "has_hyperlinks": any(
                "http" in p.text.lower() for p in doc.paragraphs
            ),
            "page_count": max(1, len(doc.paragraphs) // 40),
            "section_count": len(doc.sections),
        }
    def get_word_count(self, document_id: str) -> Dict[str, Any]:
        text = self.extract_text(document_id)
        words = text.split()
        chars = len(text)
        chars_no_spaces = len(text.replace(" ", ""))
        paragraphs = len([l for l in text.splitlines() if l.strip()])
        sentences = len(re.findall(r"[.!?]+", text))
        return {
            "words": len(words),
            "characters": chars,
            "characters_no_spaces": chars_no_spaces,
            "paragraphs": paragraphs,
            "sentences": sentences,
            "pages": max(1, len(words) // 250),
            "reading_time_minutes": max(1, len(words) // 200),
        }
    def search_text(
        self,
        document_id: str,
        search_term: str,
        case_sensitive: bool = False,
        whole_word: bool = False,
    ) -> Dict[str, Any]:
        text = self.extract_text(document_id)
        if not case_sensitive:
            text_lower = text.lower()
            term_lower = search_term.lower()
        else:
            text_lower = text
            term_lower = search_term
        if whole_word:
            pattern = r"\b" + re_lib.escape(term_lower) + r"\b"
        else:
            pattern = re_lib.escape(term_lower)
        matches = []
        for m in re_lib.finditer(pattern, text_lower):
            start = max(0, m.start() - 50)
            end = min(len(text), m.end() + 50)
            line = text[: m.start()].count("\n") + 1
            matches.append({
                "position": m.start(),
                "context": text[start:end],
                "line": line,
            })
        return {
            "matches": matches,
            "total_matches": len(matches),
        }
    def export_to_markdown(
        self,
        document_id: str,
        output_path: str,
        return_content: bool = True,
    ) -> Any:
        text = self.extract_text(document_id)
        md_lines = []
        for line in text.splitlines():
            t = line.strip()
            if not t:
                md_lines.append("")
                continue
            if len(t) < 100 and any(c.isupper() for c in t):
                if all(c.isupper() or c.isspace() for c in t):
                    md_lines.append(f"# {t}")
                else:
                    md_lines.append(f"## {t}")
            else:
                md_lines.append(t)
        md = "\n\n".join(md_lines)
        os.makedirs(os.path.dirname(output_path) or ".", exist_ok=True)
        with open(output_path, "w", encoding="utf-8") as f:
            f.write(md)
        return file_to_result(output_path, return_content=return_content)
    def export_to_html(
        self,
        document_id: str,
        output_path: str,
        return_content: bool = True,
    ) -> Any:
        text = self.extract_text(document_id)
        html_parts = ['<html><head><meta charset="utf-8"></head><body>\n']
        for line in text.splitlines():
            t = line.strip()
            if not t:
                continue
            if len(t) < 100 and any(c.isupper() for c in t):
                if all(c.isupper() or c.isspace() for c in t):
                    html_parts.append(f"<h1>{t}</h1>")
                else:
                    html_parts.append(f"<h2>{t}</h2>")
            elif t.startswith("- ") or t.startswith("* "):
                html_parts.append(f"<ul><li>{t[2:]}</li></ul>")
            else:
                html_parts.append(f"<p>{t}</p>")
        html_parts.append("</body></html>\n")
        html = "\n".join(html_parts)
        os.makedirs(os.path.dirname(output_path) or ".", exist_ok=True)
        with open(output_path, "w", encoding="utf-8") as f:
            f.write(html)
        return file_to_result(output_path, return_content=return_content)
    # ---- security and storage info ----
    def get_security_info(self) -> Dict[str, Any]:
        return {
            "readonly_mode": self.security_config.readonly_mode,
            "sandbox_mode": self.security_config.sandbox_mode,
            "allow_external_tools": self.security_config.allow_external_tools,
            "allow_network": self.security_config.allow_network,
            "max_document_size": self.security_config.max_document_size,
            "max_open_documents": self.security_config.max_open_documents,
        }
    def get_storage_info(self) -> Dict[str, Any]:
        total = 0
        for info in self.documents.values():
            try:
                total += os.path.getsize(info["path"])
            except OSError:
                pass
        return {
            "temp_base": self._temp_base,
            "open_documents": len(self.documents),
            "total_size_bytes": total,
        }
    # ---- templates ----
    def open_template(self, name: str, templates_dir: str) -> str:
        path = os.path.join(templates_dir, name)
        if not os.path.isfile(path):
            raise ValueError(f"Template not found: {name}")
        return self.open_document(path)
    def generate_from_template(
        self,
        template_name: str,
        output_path: str,
        fields: Dict[str, str],
        return_content: bool = True,
    ) -> Any:
        template_path = os.path.join(self.templates_dir, template_name)
        if not os.path.isfile(template_path):
            raise ValueError(f"Template not found: {template_name}")
        doc_id = self.open_document(template_path)
        for key, value in fields.items():
            placeholder = "{{" + key + "}}"
            self.find_and_replace_advanced(
                doc_id,
                pattern=placeholder,
                replacement=str(value),
                case_sensitive=False,
                whole_word=True,
                use_regex=False,
                return_content=False,
            )
        self.save_document(doc_id, output_path, return_content=False)
        self.close_document(doc_id)
        return file_to_result(output_path, return_content=return_content)
    # ---- internal helper ----
    def _maybe_return_doc(
        self,
        document_id: str,
        return_content: bool,
    ) -> Any:
        """
        If return_content is True, save the current document in-memory state
        to its path and return base64 content.
        """
        if not return_content:
            return {"success": True, "document_id": document_id}
        info = self.documents[document_id]
        info["doc"].save(info["path"])
        return file_to_result(info["path"], return_content=True)
@@ -0,0 +1,96 @@
 from __future__ import annotations
 from dataclasses import dataclass
 from typing import Set
@dataclass
class SecurityConfig:
    """Security-related settings for the server, plus a short text summary."""
    # Boolean mode switches.
    readonly_mode: bool
    sandbox_mode: bool
    allow_external_tools: bool
    allow_network: bool
    # Numeric limits.
    max_document_size: int
    max_open_documents: int
    def get_summary(self) -> str:
        """Return the enabled mode labels joined by ", ", or "default" if none."""
        labelled_flags = (
            (self.readonly_mode, "readonly"),
            (self.sandbox_mode, "sandbox"),
            (self.allow_external_tools, "external-tools"),
            (self.allow_network, "network"),
        )
        enabled = [label for flag, label in labelled_flags if flag]
        if not enabled:
            return "default"
        return ", ".join(enabled)
 # Tool names that remain callable when readonly mode is enabled.
 READONLY_COMMANDS: Set[str] = {
    # Opening and listing
    "list_documents",
    "open_document",
    "list_templates",
    # Content inspection
    "extract_text",
    "search_text",
    "get_word_count",
    "get_tables",
    "list_images",
    "list_hyperlinks",
    "get_fields_summary",
    # Structure and formatting inspection
    "get_document_structure",
    "get_outline",
    "get_ranges",
    "analyze_formatting",
    # Metadata
    "get_metadata",
    "get_document_properties",
    # Server status
    "get_security_info",
    "get_storage_info",
 }
 # Tool names that create, change, save, convert, or export documents.
 WRITE_COMMANDS: Set[str] = {
    # Document lifecycle
    "create_document",
    "save_document",
    "close_document",
    "open_template",
    "generate_from_template",
    # Adding content
    "add_paragraph",
    "add_heading",
    "add_table",
    "add_section_break",
    "add_list",
    "add_list_item",
    "add_page_break",
    "add_image",
    "add_hyperlink",
    # Navigation aids, headers, footers, and fields
    "insert_toc",
    "insert_bookmark_after_heading",
    "insert_after_heading",
    "set_header",
    "set_footer",
    "set_page_numbering",
    "embed_page_number_fields",
    # Editing existing content
    "find_and_replace",
    "find_and_replace_advanced",
    "apply_paragraph_format",
    "replace_range_text",
    "set_table_cell_text",
    "set_document_properties",
    # Sanitizing
    "sanitize_external_links",
    "redact_text",
    "strip_personal_info",
    # Conversion and export
    "convert_to_pdf",
    "export_pdf_with_field_refresh",
    "convert_to_images",
    "convert_to_images_with_preference",
    "export_to_markdown",
    "export_to_html",
    # Combining and splitting
    "merge_documents",
    "split_document",
 }
 def is_command_allowed(name: str, config: SecurityConfig) -> bool:
    """
    Decide whether the tool called *name* may run under *config*.

    Outside readonly mode every command is allowed; in readonly mode only
    names listed in READONLY_COMMANDS are.
    """
    if not config.readonly_mode:
        return True
    return name in READONLY_COMMANDS
@@ -0,0 +1,709 @@
 from __future__ import annotations
 import json
 import logging
 import os
 import sys
 from typing import Any
 from mcp.server.fastmcp import FastMCP
 import uvicorn
 from py_docx.docx_tools import DocxToolsProvider
 from py_docx.security import SecurityConfig, is_command_allowed
 from py_docx.templates import list_templates
 # Configure the root logger at import time: INFO level, timestamped format.
 logging.basicConfig(
    level=logging.INFO,
    format="%(asctime)s [%(levelname)s] %(name)s: %(message)s",
 )
 # Logger for this server, named "py-docx-mcp".
 logger = logging.getLogger("py-docx-mcp")
 # Templates directory; read from DOCX_MCP_TEMPLATES_DIR, falling back to /templates.
 TEMPLATES_DIR = os.getenv("DOCX_MCP_TEMPLATES_DIR", "/templates")
 class ApiKeyAuthMiddleware:
    """
    ASGI middleware that rejects HTTP requests lacking the configured API key.

    The key may be supplied as either:
      - Authorization: Bearer <key>   (scheme matched case-insensitively)
      - X-API-Key: <key>

    When an Authorization header with the Bearer scheme is present it takes
    precedence over X-API-Key. Scopes whose type is not "http" are forwarded
    to the wrapped app without a check.
    """
    def __init__(self, app, api_key: str):
        """Wrap *app* and remember the key every HTTP request must present."""
        self.app = app
        self.api_key = api_key
    def _is_authorized(self, raw_headers) -> bool:
        """Return True when *raw_headers* (ASGI byte pairs) carry the API key."""
        import hmac  # local import keeps this block self-contained
        # Work on the raw header bytes: decoding them as UTF-8 would raise on
        # a malformed header and turn a bad request into a server error.
        headers = {key.lower(): value for key, value in raw_headers}
        auth = headers.get(b"authorization", b"")
        api_key_header = headers.get(b"x-api-key", b"")
        scheme = b"bearer "
        provided = b""
        if auth[: len(scheme)].lower() == scheme:
            provided = auth[len(scheme):].strip()
        elif api_key_header:
            provided = api_key_header.strip()
        # Constant-time comparison so response timing does not leak how much
        # of a guessed key was correct.
        return hmac.compare_digest(provided, self.api_key.encode("utf-8"))
    async def __call__(self, scope, receive, send):
        """
        Forward the request when the key matches; otherwise answer 401 with a
        small JSON error body and do not call the wrapped app.
        """
        if scope["type"] != "http":
            await self.app(scope, receive, send)
            return
        if not self._is_authorized(scope.get("headers", [])):
            await send(
                {
                    "type": "http.response.start",
                    "status": 401,
                    "headers": [(b"content-type", b"application/json")],
                }
            )
            await send(
                {
                    "type": "http.response.body",
                    "body": json.dumps({"error": "Invalid or missing API key"}).encode("utf-8"),
                }
            )
            return
        await self.app(scope, receive, send)
 def make_server(
    readonly_mode: bool = False,
    sandbox_mode: bool = False,
    allow_external_tools: bool = False,
    allow_network: bool = False,
    max_document_size: int = 100 * 1024 * 1024,
    max_open_documents: int = 30,
 ) -> FastMCP:
    """
    Build the FastMCP server and register every DOCX tool on it.

    The keyword arguments are copied into a SecurityConfig that is handed to
    the DocxToolsProvider and consulted before each tool call.

    Args:
        readonly_mode: When true, only commands accepted by
            ``is_command_allowed`` in readonly mode may run.
        sandbox_mode: Stored in the SecurityConfig.
        allow_external_tools: Stored in the SecurityConfig.
        allow_network: Stored in the SecurityConfig.
        max_document_size: Stored in the SecurityConfig (bytes).
        max_open_documents: Stored in the SecurityConfig.

    Returns:
        The configured FastMCP instance.
    """
    import functools  # local import: only needed while registering tools
    mcp = FastMCP(
        "py-docx-mcp",
        instructions="DOCX tools for reading and exporting via MCP (Python, Streamable HTTP)",
    )
    security_config = SecurityConfig(
        readonly_mode=readonly_mode,
        sandbox_mode=sandbox_mode,
        allow_external_tools=allow_external_tools,
        allow_network=allow_network,
        max_document_size=max_document_size,
        max_open_documents=max_open_documents,
    )
    provider = DocxToolsProvider(
        security_config=security_config,
        templates_dir=TEMPLATES_DIR,
    )
    def register(tool_name: str, description: str, fn) -> None:
        """Register *fn* as tool *tool_name*, guarded by the security policy."""
        # functools.wraps keeps the lambda's signature discoverable through
        # __wrapped__, so the parameter names and defaults written below are
        # what signature inspection sees rather than a bare **kwargs.
        @functools.wraps(fn)
        def guarded(*args, **kwargs):
            if not is_command_allowed(tool_name, security_config):
                raise ValueError(f"Command '{tool_name}' not allowed by security policy")
            return fn(*args, **kwargs)
        # name/description are arguments of tool() itself; the decorator it
        # returns accepts only the function.
        mcp.tool(name=tool_name, description=description)(guarded)
    # ---- document lifecycle ----
    register(
        "create_document",
        "Create a new empty DOCX document",
        lambda: provider.create_document(),
    )
    register(
        "open_document",
        "Open an existing DOCX document",
        lambda path: provider.open_document(path),
    )
    # ---- adding content ----
    register(
        "add_paragraph",
        "Add a paragraph with optional styling to the document",
        lambda document_id, text, style=None, return_content=False: provider.add_paragraph(
            document_id, text, style or {}, return_content=return_content
        ),
    )
    register(
        "add_heading",
        "Add a heading to the document",
        lambda document_id, text, level, return_content=False: provider.add_heading(
            document_id, text, level, return_content=return_content
        ),
    )
    register(
        "add_table",
        "Add a table to the document",
        lambda document_id, rows, headers=None, border_style=None, col_widths=None, cell_shading=None, merges=None, return_content=False: provider.add_table(
            document_id,
            rows,
            headers=headers,
            border_style=border_style,
            col_widths=col_widths,
            cell_shading=cell_shading,
            merges=merges,
            return_content=return_content,
        ),
    )
    register(
        "add_section_break",
        "Insert a section break with optional page setup",
        lambda document_id, page_size=None, orientation=None, margins=None, return_content=False: provider.add_section_break(
            document_id, page_size, orientation, margins or {}, return_content=return_content
        ),
    )
    register(
        "add_list",
        "Add a bulleted or numbered list to the document",
        lambda document_id, items, ordered=False, return_content=False: provider.add_list(
            document_id, items, ordered, return_content=return_content
        ),
    )
    register(
        "add_list_item",
        "Add a single list item with a specific level",
        lambda document_id, text, level=0, ordered=False, return_content=False: provider.add_list_item(
            document_id, text, level, ordered, return_content=return_content
        ),
    )
    register(
        "add_page_break",
        "Add a page break to the document",
        lambda document_id, return_content=False: provider.add_page_break(
            document_id, return_content=return_content
        ),
    )
    register(
        "insert_toc",
        "Insert a Table of Contents placeholder",
        lambda document_id, from_level=1, to_level=3, right_align_dots=True, return_content=False: provider.insert_toc(
            document_id, from_level, to_level, right_align_dots, return_content=return_content
        ),
    )
    register(
        "insert_bookmark_after_heading",
        "Insert a bookmark immediately after the first matching heading",
        lambda document_id, heading_text, name, return_content=False: provider.insert_bookmark_after_heading(
            document_id, heading_text, name, return_content=return_content
        ),
    )
    # ---- headers, footers, page numbers ----
    register(
        "set_header",
        "Set the document header",
        lambda document_id, text, return_content=False: provider.set_header(
            document_id, text, return_content=return_content
        ),
    )
    register(
        "set_footer",
        "Set the document footer",
        lambda document_id, text, return_content=False: provider.set_footer(
            document_id, text, return_content=return_content
        ),
    )
    register(
        "set_page_numbering",
        "Set a simple page numbering text in header or footer",
        lambda document_id, location="footer", template=None, return_content=False: provider.set_page_numbering(
            document_id, location, template, return_content=return_content
        ),
    )
    register(
        "embed_page_number_fields",
        "Replace placeholder 'Page {PAGE} of {PAGES}' with Word field codes (best-effort)",
        lambda document_id, return_content=False: provider.embed_page_number_fields(
            document_id, return_content=return_content
        ),
    )
    # ---- images and links ----
    register(
        "add_image",
        "Insert an image into the document",
        lambda document_id, data_base64, width=None, height=None, alt_text=None, return_content=False: provider.add_image(
            document_id, data_base64, width, height, alt_text, return_content=return_content
        ),
    )
    register(
        "add_hyperlink",
        "Insert a hyperlink into the document",
        lambda document_id, text, url, return_content=False: provider.add_hyperlink(
            document_id, text, url, return_content=return_content
        ),
    )
    # ---- find / replace / formatting ----
    register(
        "find_and_replace",
        "Find and replace text in the document",
        lambda document_id, find_text, replace_text, return_content=False: provider.find_and_replace(
            document_id, find_text, replace_text, return_content=return_content
        ),
    )
    register(
        "find_and_replace_advanced",
        "Find/replace with regex, case, whole-word, preserving runs",
        lambda document_id, pattern, replacement, case_sensitive=False, whole_word=False, use_regex=False, return_content=False: provider.find_and_replace_advanced(
            document_id, pattern, replacement, case_sensitive, whole_word, use_regex, return_content=return_content
        ),
    )
    register(
        "apply_paragraph_format",
        "Apply paragraph formatting to paragraphs matching a simple selector",
        lambda document_id, contains=None, format=None, return_content=False: provider.apply_paragraph_format(
            document_id, contains, format or {}, return_content=return_content
        ),
    )
    # ---- reading content ----
    register(
        "extract_text",
        "Extract all text content from the document",
        lambda document_id: provider.extract_text(document_id),
    )
    register(
        "get_tables",
        "List tables with dimensions, merges, and cell content",
        lambda document_id: provider.get_tables(document_id),
    )
    register(
        "list_images",
        "List images with width/height and alt text",
        lambda document_id: provider.list_images(document_id),
    )
    register(
        "list_hyperlinks",
        "List hyperlinks in the document",
        lambda document_id: provider.list_hyperlinks(document_id),
    )
    register(
        "get_fields_summary",
        "Summarize Word fields (PAGE, NUMPAGES, TOC) in document and headers/footers",
        lambda document_id: provider.get_fields_summary(document_id),
    )
    register(
        "strip_personal_info",
        "Remove personal info from metadata and core.xml (best-effort)",
        lambda document_id: provider.strip_personal_info(document_id),
    )
    register(
        "get_metadata",
        "Get document metadata",
        lambda document_id: provider.get_metadata(document_id),
    )
    # ---- saving, closing, listing ----
    register(
        "save_document",
        "Save the document to a specific path and return its content",
        lambda document_id, output_path, return_content=True: provider.save_document(
            document_id, output_path, return_content=return_content
        ),
    )
    register(
        "close_document",
        "Close the document and free resources",
        lambda document_id: provider.close_document(document_id),
    )
    register(
        "list_documents",
        "List all open documents",
        lambda: provider.list_documents(),
    )
    # ---- conversion ----
    register(
        "convert_to_pdf",
        "Convert a DOCX document to PDF and return the file",
        lambda document_id, output_path, prefer_external=False, return_content=True: provider.convert_to_pdf(
            document_id, output_path, prefer_external, return_content=return_content
        ),
    )
    register(
        "export_pdf_with_field_refresh",
        "Embed page fields then export to PDF (hi-fidelity when available)",
        lambda document_id, output_path, prefer_external=True, return_content=True: provider.export_pdf_with_field_refresh(
            document_id, output_path, prefer_external, return_content=return_content
        ),
    )
    register(
        "convert_to_images",
        "Convert a DOCX document to images (one per page) and return them",
        lambda document_id, output_dir, format="png", dpi=150, return_content=True: provider.convert_to_images(
            document_id, output_dir, format, dpi, return_content=return_content
        ),
    )
    register(
        "convert_to_images_with_preference",
        "Convert DOCX to images, preferring external hi-fidelity path",
        lambda document_id, output_dir, format="png", dpi=150, prefer_external=True, return_content=True: provider.convert_to_images_with_preference(
            document_id, output_dir, format, dpi, prefer_external, return_content=return_content
        ),
    )
    # ---- merge / split ----
    register(
        "merge_documents",
        "Merge multiple DOCX documents into one and return the result",
        lambda document_ids, output_path, return_content=True: provider.merge_documents(
            document_ids, output_path, return_content=return_content
        ),
    )
    register(
        "split_document",
        "Split a document at page breaks and return parts",
        lambda document_id, output_dir, return_content=True: provider.split_document(
            document_id, output_dir, return_content=return_content
        ),
    )
    # ---- structure and ranges ----
    register(
        "get_document_structure",
        "Get the structural overview of the document (headings, sections, etc.)",
        lambda document_id: provider.get_document_structure(document_id),
    )
    register(
        "get_outline",
        "Return heading outline with range_ids",
        lambda document_id: provider.get_outline(document_id),
    )
    register(
        "get_ranges",
        "Resolve a selector to range_ids",
        lambda document_id, selector: provider.get_ranges(document_id, selector),
    )
    register(
        "replace_range_text",
        "Replace text in a paragraph/heading by range_id",
        lambda document_id, range_id, text, return_content=False: provider.replace_range_text(
            document_id, range_id, text, return_content=return_content
        ),
    )
    register(
        "set_table_cell_text",
        "Set text in a table cell by indices",
        lambda document_id, table_index, row, col, text, return_content=False: provider.set_table_cell_text(
            document_id, table_index, row, col, text, return_content=return_content
        ),
    )
    # ---- document properties ----
    register(
        "get_document_properties",
        "Get document properties (title, subject, author, timestamps)",
        lambda document_id: provider.get_document_properties(document_id),
    )
    register(
        "set_document_properties",
        "Set document properties (title, subject, author)",
        lambda document_id, title=None, subject=None, author=None, return_content=False: provider.set_document_properties(
            document_id, title, subject, author, return_content=return_content
        ),
    )
    register(
        "insert_after_heading",
        "Insert a paragraph after the first heading that matches text",
        lambda document_id, heading_text, text, return_content=False: provider.insert_after_heading(
            document_id, heading_text, text, return_content=return_content
        ),
    )
    # ---- sanitizing ----
    register(
        "sanitize_external_links",
        "Remove external hyperlinks (http/https)",
        lambda document_id: provider.sanitize_external_links(document_id),
    )
    register(
        "redact_text",
        "Redact text using regex/whole-word with █ character",
        lambda document_id, pattern, use_regex=False, whole_word=False, case_sensitive=False, return_content=False: provider.redact_text(
            document_id, pattern, use_regex, whole_word, case_sensitive, return_content=return_content
        ),
    )
    # ---- analysis and search ----
    register(
        "analyze_formatting",
        "Analyze the formatting used throughout the document",
        lambda document_id: provider.analyze_formatting(document_id),
    )
    register(
        "get_word_count",
        "Get detailed word count statistics for the document",
        lambda document_id: provider.get_word_count(document_id),
    )
    register(
        "search_text",
        "Search for text patterns in the document",
        lambda document_id, search_term, case_sensitive=False, whole_word=False: provider.search_text(
            document_id, search_term, case_sensitive, whole_word
        ),
    )
    # ---- text exports ----
    register(
        "export_to_markdown",
        "Export document content to Markdown format and return the file",
        lambda document_id, output_path, return_content=True: provider.export_to_markdown(
            document_id, output_path, return_content=return_content
        ),
    )
    register(
        "export_to_html",
        "Export document content to HTML format and return the file",
        lambda document_id, output_path, return_content=True: provider.export_to_html(
            document_id, output_path, return_content=return_content
        ),
    )
    # ---- server information ----
    register(
        "get_security_info",
        "Get information about current security settings and restrictions",
        lambda: provider.get_security_info(),
    )
    register(
        "get_storage_info",
        "Get information about temporary storage usage",
        lambda: provider.get_storage_info(),
    )
    # ---- templates ----
    register(
        "list_templates",
        "List available document templates from the templates directory",
        lambda: list_templates(TEMPLATES_DIR),
    )
    register(
        "open_template",
        "Open a template document by name from the templates directory",
        lambda name: provider.open_template(name, TEMPLATES_DIR),
    )
    register(
        "generate_from_template",
        "Generate a new document from a template and return the file",
        lambda template_name, output_path, fields=None, return_content=True: provider.generate_from_template(
            template_name, output_path, fields or {}, return_content=return_content
        ),
    )
    return mcp
 def main():
    """
    Read configuration from DOCX_MCP_* environment variables and serve the
    MCP server over HTTP with uvicorn.

    Boolean variables count as enabled when set to "true" or "1"
    (case-insensitive). When DOCX_MCP_API_KEY is non-empty the ASGI app is
    wrapped in ApiKeyAuthMiddleware; otherwise a warning is logged and the
    server runs without authentication.

    Raises:
        ValueError: If a numeric variable does not parse as an integer.
        RuntimeError: If the FastMCP instance offers no ASGI app factory.
    """
    truthy = ("true", "1")
    readonly_mode = os.getenv("DOCX_MCP_READONLY", "false").lower() in truthy
    sandbox_mode = os.getenv("DOCX_MCP_SANDBOX", "true").lower() in truthy
    allow_external_tools = os.getenv("DOCX_MCP_ALLOW_EXTERNAL_TOOLS", "false").lower() in truthy
    allow_network = os.getenv("DOCX_MCP_ALLOW_NETWORK", "false").lower() in truthy
    max_document_size = int(os.getenv("DOCX_MCP_MAX_SIZE", "104857600"))
    max_open_documents = int(os.getenv("DOCX_MCP_MAX_DOCS", "30"))
    api_key = os.getenv("DOCX_MCP_API_KEY", "").strip()
    mcp = make_server(
        readonly_mode=readonly_mode,
        sandbox_mode=sandbox_mode,
        allow_external_tools=allow_external_tools,
        allow_network=allow_network,
        max_document_size=max_document_size,
        max_open_documents=max_open_documents,
    )
    # Build the ASGI app. The MCP SDK's FastMCP provides streamable_http_app();
    # to_asgi_app is kept only as a fallback for an SDK that offers it.
    # NOTE(review): the SDK serves the endpoint at its configured streamable
    # HTTP path ("/mcp" by default) - confirm the URL documented for clients.
    build_app = getattr(mcp, "streamable_http_app", None) or getattr(mcp, "to_asgi_app", None)
    if build_app is None:
        raise RuntimeError("Installed MCP SDK exposes no Streamable HTTP ASGI app factory")
    app = build_app()
    # Apply API key auth if configured
    if api_key:
        app = ApiKeyAuthMiddleware(app, api_key)
    else:
        logger.warning("DOCX_MCP_API_KEY is not set; serving without authentication")
    host = os.getenv("DOCX_MCP_HTTP_HOST", "0.0.0.0")
    port = int(os.getenv("DOCX_MCP_HTTP_PORT", "3000"))
    # Run with uvicorn (Streamable HTTP transport for OpenWebUI)
    uvicorn.run(app, host=host, port=port, log_level="info")
 if __name__ == "__main__":
    main()
@@ -0,0 +1,22 @@
 from __future__ import annotations
 import os
 from typing import List
 def list_templates(templates_dir: str) -> dict:
    """
    List the ``.docx`` files located directly inside *templates_dir*.

    Returns a dict ``{"templates": [...]}`` whose list holds the matching file
    names in sorted order; the extension test ignores case. A path that is not
    a directory yields an empty list.
    """
    if os.path.isdir(templates_dir):
        names = sorted(
            entry
            for entry in os.listdir(templates_dir)
            if os.path.isfile(os.path.join(templates_dir, entry))
            and entry.lower().endswith(".docx")
        )
    else:
        names = []
    return {"templates": names}
 def open_template_path(templates_dir: str, name: str) -> str:
    """
    Return the path of template *name* inside *templates_dir*.

    Args:
        templates_dir: Directory that holds the template files.
        name: File name of the template, relative to *templates_dir*.

    Returns:
        ``os.path.join(templates_dir, name)`` when it is an existing file
        located under *templates_dir*.

    Raises:
        ValueError: If *name* resolves outside *templates_dir* or does not
            refer to an existing file.
    """
    path = os.path.join(templates_dir, name)
    # Refuse names ("../x", absolute paths) that normalize to somewhere
    # outside the templates directory.
    root = os.path.abspath(templates_dir)
    try:
        contained = os.path.commonpath([root, os.path.abspath(path)]) == root
    except ValueError:
        # Paths that cannot be compared (e.g. different Windows drives).
        contained = False
    if not contained or not os.path.isfile(path):
        raise ValueError(f"Template not found: {name}")
    return path
		`@@ -0,0 +1 @@`
							`# py-docx-mcp: Python MCP server for DOCX document manipulation`