# data-label-factory / pyproject.toml
# Last commit: feat(identify): open-set image retrieval subpackage (37ddbc1)
[build-system]
# PEP 517 build configuration. setuptools is the only build-time requirement;
# "wheel" is intentionally not listed because the setuptools backend requests
# it on its own when a wheel is actually being built, and listing it here
# would force it to be installed for sdist-only builds as well.
requires = ["setuptools>=64"]
build-backend = "setuptools.build_meta"
[project]
# Core PEP 621 metadata for the distribution.
name = "data-label-factory"
version = "0.1.0"
description = "Generic auto-labeling pipeline for vision datasets — runs on a 16 GB Apple Silicon Mac via SSD-streaming MoE."
readme = "README.md"
requires-python = ">=3.10"
license = { text = "Apache-2.0" }
authors = [
    { name = "walter-grace" },
]

# Free-form search terms shown on the package index.
keywords = [
    "vision",
    "dataset",
    "labeling",
    "annotation",
    "object-detection",
    "mlx",
    "apple-silicon",
    "qwen",
    "gemma",
    "falcon-perception",
]

# Trove classifiers; the Python versions listed here should stay in step
# with `requires-python` above.
classifiers = [
    "Development Status :: 4 - Beta",
    "Intended Audience :: Developers",
    "Intended Audience :: Science/Research",
    "License :: OSI Approved :: Apache Software License",
    "Operating System :: MacOS",
    "Programming Language :: Python :: 3 :: Only",
    "Programming Language :: Python :: 3.10",
    "Programming Language :: Python :: 3.11",
    "Programming Language :: Python :: 3.12",
    "Programming Language :: Python :: 3.13",
    "Topic :: Scientific/Engineering :: Image Recognition",
]

# Always-installed runtime requirements. Heavier, feature-specific packages
# are declared as extras under [project.optional-dependencies].
dependencies = [
    "pillow>=9.0",
    "pyyaml>=6.0",
    "requests>=2.28",
]
[project.optional-dependencies]
# Extras are installed with `pip install "data-label-factory[<extra>]"`.

# gather: image-search gathering (DDG, Wikimedia, YouTube frame extraction).
gather = [
    "duckduckgo-search>=4.0",
    "yt-dlp>=2024.0.0",
]

# runpod: optional GPU path — orchestrate a RunPod pod, then publish the
# result to Hugging Face when done.
runpod = [
    "runpod>=1.7.0",
    "huggingface_hub>=0.26",
    "datasets>=3.0",
    "pyarrow>=17.0",
]

# identify: open-set CLIP retrieval — build/verify/train/serve a card-style
# index.
identify = [
    "torch>=2.1",
    "torchvision>=0.16",
    # NOTE(review): the `<2` cap likely makes this extra uninstallable on
    # Python 3.13, which the classifiers advertise — confirm and relax or add
    # an environment marker if needed.
    "numpy>=1.24,<2",
    "fastapi>=0.115",
    "uvicorn[standard]>=0.32",
    "python-multipart>=0.0.20",
    # Raises the floor above the base requirement (`pillow>=9.0`).
    "pillow>=10.0",
    "ultralytics>=8.3",
    # NOTE(review): direct-URL requirement with no pinned ref. It tracks the
    # repository's default branch, and package indexes such as PyPI reject
    # uploads whose metadata contains direct references — confirm this is
    # acceptable before publishing.
    "clip @ git+https://github.com/openai/CLIP.git",
]

# dev: test runner and linter for contributors.
dev = [
    "pytest>=7.0",
    "ruff>=0.5.0",
]
[project.urls]
# Links shown in the package metadata: GitHub locations first, then the
# Hugging Face mirror.
Homepage = "https://github.com/walter-grace/data-label-factory"
Repository = "https://github.com/walter-grace/data-label-factory"
Issues = "https://github.com/walter-grace/data-label-factory/issues"
HuggingFace = "https://huggingface.co/waltgrace/data-label-factory"
[project.scripts]
# Console entry points. Both the hyphenated and the underscored command name
# are installed, and both dispatch to the same `main` in data_label_factory.cli.
data-label-factory = "data_label_factory.cli:main"
data_label_factory = "data_label_factory.cli:main"
[tool.setuptools]
# Explicit package list (no automatic discovery): a new subpackage must be
# added here or it will not be included in the built distribution.
packages = [
    "data_label_factory",
    "data_label_factory.runpod",
    "data_label_factory.identify",
]
[tool.setuptools.package-data]
# Non-Python files shipped inside each package. "*.py" is deliberately not
# listed: the modules of every package named in [tool.setuptools] `packages`
# are always included, so only real data files need a pattern here.
# Keys are quoted because the package names contain dots.
"data_label_factory.runpod" = ["*.md", "Dockerfile", "requirements-pod.txt"]
"data_label_factory.identify" = ["*.md"]