{ "info": { "author": "Alex Kritikos", "author_email": "alex@8bitb.us", "bugtrack_url": null, "classifiers": [], "description": "Patu\n====\n\nA small spider, useful for checking a site for 404s and 500s. Patu requires httplib2 and lxml:\n\n pip install -U httplib2 lxml\n\nQuick Usage\n===========\n\nTo see available options:\n\n patu.py --help\n\nTo spider an entire site using 5 workers, only showing errors:\n\n patu.py --spiders=5 www.example.com\n \nTo spider, stopping after the first level of links:\n\n patu.py --depth=1 www.example.com\n \nTo get a list of every linked page on a site:\n\n patu.py --generate www.example.com > urls.txt\n \nInstead of spidering for URLs, use a file instead and show all responses:\n\n patu.py --input=urls.txt --verbose www.example.com\n\nFormat of URLs File\n===================\n\nThe output produced by --generate is formatted like so:\n\n FIRST_URLNone\n LINK1REFERER\n LINK2REFERER\n \n--input can take a file of that format, or one URL per line with no referer. --input=- reads from stdin.\n\nTesting\n=======\n\nPatu uses Nose for testing. To install Nose and test:\n\n pip install -U nose\n nosetests", "description_content_type": null, "docs_url": null, "download_url": "UNKNOWN", "downloads": { "last_day": -1, "last_month": -1, "last_week": -1 }, "home_page": "http://github.com/akrito/patu", "keywords": null, "license": "UNKNOWN", "maintainer": null, "maintainer_email": null, "name": "patu", "package_url": "https://pypi.org/project/patu/", "platform": "UNKNOWN", "project_url": "https://pypi.org/project/patu/", "project_urls": { "Download": "UNKNOWN", "Homepage": "http://github.com/akrito/patu" }, "release_url": "https://pypi.org/project/patu/0.1/", "requires_dist": null, "requires_python": null, "summary": "Patu is a small spider", "version": "0.1" }, "last_serial": 796066, "releases": { "0.1": [ { "comment_text": "", "digests": { "md5": "920fa7869446408bf1641dc98be1ee64", "sha256": "3d57674b597576f66602e1e8a80339fab9d629b587c8bdae2d69db541c19e472" }, "downloads": -1, "filename": "patu-0.1.tar.gz", "has_sig": false, "md5_digest": "920fa7869446408bf1641dc98be1ee64", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 9077, "upload_time": "2010-05-19T05:29:08", "url": "https://files.pythonhosted.org/packages/43/d4/45fbd3af3708aea8cf1a41a5cab2572c2db9aadd57506f3f6e3e1b3bfe82/patu-0.1.tar.gz" } ] }, "urls": [ { "comment_text": "", "digests": { "md5": "920fa7869446408bf1641dc98be1ee64", "sha256": "3d57674b597576f66602e1e8a80339fab9d629b587c8bdae2d69db541c19e472" }, "downloads": -1, "filename": "patu-0.1.tar.gz", "has_sig": false, "md5_digest": "920fa7869446408bf1641dc98be1ee64", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 9077, "upload_time": "2010-05-19T05:29:08", "url": "https://files.pythonhosted.org/packages/43/d4/45fbd3af3708aea8cf1a41a5cab2572c2db9aadd57506f3f6e3e1b3bfe82/patu-0.1.tar.gz" } ] }