mcp-pdf-tools/pyproject.toml
Ryan Malloy 4090c788a2
Some checks failed
Security Scan / security-scan (push) Has been cancelled
Strip operator-private files from sdist + add structural defense
The PII audit run before this publish caught three files that have been
leaking operator-specific paths to PyPI in v2.1.6, v2.1.7, and v2.2.0:

- claude_desktop_config.json (personal Claude Desktop config snapshot)
- mcp-pdf-tools-launcher.sh (obsolete — uvx replaces it)
- mcp-config-example.json (had hardcoded /home/rpm path + old package name)

Fix:
- Delete the personal config and obsolete launcher
- Sanitize the example to use uvx with the [markdown] extra (matches docs)
- Add [tool.hatch.build.targets.sdist] exclude block per
  ~/.claude/rules/python.md to prevent recurrence — covers dev artifacts,
  fixture PDFs, internal architecture notes, and CI scripts

Side benefit: sdist size dropped from 2.4 MB to 304 KB (8× reduction),
mostly from excluding examples/*.pdf and the tests/ fixture PDF.

The /home/rpm leaks in prior versions are not credentials, just operator
paths — not yanking. Going forward the unpacked-sdist grep is mandatory
before each publish.
2026-05-05 17:38:13 -06:00

154 lines
3.9 KiB
TOML

[project]
name = "mcp-pdf"
version = "2.2.1"
description = "Secure FastMCP server for comprehensive PDF processing - text extraction, OCR, table extraction, forms, annotations, and more"
authors = [{name = "Ryan Malloy", email = "ryan@malloys.us"}]
readme = "README.md"
license = {text = "MIT"}
requires-python = ">=3.10"
keywords = [
"mcp",
"fastmcp",
"pdf",
"ocr",
"text-extraction",
"table-extraction",
"pdf-processing",
"api",
"integration"
]
classifiers = [
"Development Status :: 4 - Beta",
"Intended Audience :: Developers",
"License :: OSI Approved :: MIT License",
"Programming Language :: Python :: 3",
"Programming Language :: Python :: 3.10",
"Programming Language :: Python :: 3.11",
"Programming Language :: Python :: 3.12",
"Topic :: Software Development :: Libraries :: Python Modules",
"Topic :: Text Processing :: General",
"Topic :: Office/Business",
]
dependencies = [
"fastmcp>=0.1.0",
"httpx>=0.25.0",
"pydantic>=2.0.0",
"python-dotenv>=1.0.0",
"PyMuPDF>=1.23.0",
"pdfplumber>=0.10.0",
"pytesseract>=0.3.10",
"pdf2image>=1.16.0",
"pypdf>=6.0.0",
"pandas>=2.0.0",
"Pillow>=10.0.0",
"markdown>=3.5.0",
]
[project.urls]
Homepage = "https://github.com/rsp2k/mcp-pdf"
Documentation = "https://github.com/rsp2k/mcp-pdf#readme"
Repository = "https://github.com/rsp2k/mcp-pdf.git"
Issues = "https://github.com/rsp2k/mcp-pdf/issues"
Changelog = "https://github.com/rsp2k/mcp-pdf/releases"
[project.scripts]
mcp-pdf = "mcp_pdf.server:main"
mcp-pdf-legacy = "mcp_pdf.server_legacy:main"
mcp-pdf-modular = "mcp_pdf.server_refactored:main"
[project.optional-dependencies]
# Form creation features (create_form_pdf, advanced form tools)
forms = [
"reportlab>=4.0.0",
]
# Advanced table extraction (camelot needs Ghostscript, tabula needs Java)
tables = [
"camelot-py[cv]>=0.11.0",
"tabula-py>=2.8.0",
]
# Markdown → PDF conversion (requires pandoc binary + a PDF engine such as
# xelatex, pdflatex, tectonic, weasyprint, or wkhtmltopdf)
markdown = [
"pypandoc>=1.13",
]
# All optional features
all = [
"reportlab>=4.0.0",
"camelot-py[cv]>=0.11.0",
"tabula-py>=2.8.0",
"pypandoc>=1.13",
]
# Development dependencies
dev = [
"pytest>=7.0.0",
"pytest-asyncio>=0.21.0",
"black>=23.0.0",
"ruff>=0.1.0",
"mypy>=1.0.0",
"build>=0.10.0",
"twine>=4.0.0",
"safety>=3.0.0",
"pip-audit>=2.0.0",
]
[build-system]
requires = ["hatchling"]
build-backend = "hatchling.build"
# Keep dev-only artifacts out of the sdist that ships to PyPI.
# (The PII audit also runs against the unpacked sdist before each publish —
# see ~/.claude/rules/python.md.)
[tool.hatch.build.targets.sdist]
exclude = [
"CLAUDE.md", # operator-private project context
".env", ".env.local", # never ship credentials
".mcp.json", # contains local filesystem paths
".pytest_cache/",
".ruff_cache/",
"build/",
"dist/",
"examples/page_001.png",
"examples/*.pdf", # demo PDFs are large + not needed by end users
"examples/test_demo.*",
"tests/CopperSprings_DigitalPortfolio.pdf", # large fixture PDF
"test_security_features.py",
"test_integration.py",
"MCPMIXIN_*.md", # internal architecture/migration notes
"MCP_DOCX_TOOLS_PLAN.md",
"claude-mcp-manager", # personal helper script
"run-mcp-server.sh",
"docker-compose.yml",
"Dockerfile",
]
[tool.pytest.ini_options]
asyncio_mode = "auto"
addopts = "-v --tb=short"
testpaths = ["tests"]
python_files = ["test_*.py", "*_test.py"]
[tool.hatchling.build.targets.sdist]
include = [
"/src",
"/tests",
"/examples",
"README.md",
"LICENSE",
"MANIFEST.in",
]
[dependency-groups]
dev = [
"pip-audit>=2.9.0",
"pytest>=8.4.1",
"pytest-asyncio>=1.1.0",
"pytest-cov>=6.2.1",
"reportlab>=4.4.3",
"safety>=3.2.11",
"twine>=6.1.0",
]