uvicorn crawler_api:app --host 0.0.0.0 --port 8000
python crawler_api.py
curl -X POST http://localhost:8000/start
curl -X POST http://localhost:8000/start \
  -H "Content-Type: application/json" \
  -d '{"max_pages": 50000, "num_workers": 8}'
kvs_worker/
├── pt-crawl/
│   ├── __ab/
│   │   └── abc123def456...
│   └── __cd/
│       └── cde789...
└── pt-hosts/
    └── en.wikipedia.org
POST /start    # Start crawling (optional: custom seeds, max_pages, etc.)
POST /stop     # Stop crawling
GET  /status   # Progress, rate, ETA, queue size
GET  /stats    # Detailed stats (top domains, etc.)