{ "info": { "author": "Oscar Sanchez", "author_email": "hmax.bf4@gmail.com", "bugtrack_url": null, "classifiers": [ "Development Status :: 4 - Beta", "Environment :: Web Environment", "Intended Audience :: Developers", "License :: OSI Approved :: MIT License", "Natural Language :: English", "Operating System :: OS Independent", "Programming Language :: Python" ], "description": "Python Scraper\n==============\n\nA simple web scraper made in python with love:\n\nInstall with pip:\n-----------------\n\n.. code:: sh\n\n pip install simplescraper\n\n\nUsage:\n------\n\nMake a simple call to a web page, lets call 'www.test.com'\n\n.. code:: python\n\n from simplescraper import SimpleScraper\n\n test = SimpleScraper()\n result = test.get_scraped_data('www.test.com')\n print result\n\noutput:\n~~~~~~~\n\n.. code:: javascript\n\n {\n url: 'http://www.test.com', \n source: 'www.test.com', \n image: 'http://www.test.com/some/random/image.png',\n title: 'Just a test page'\n }\n\nYou can also call it without using the 'www' as 'test.com' if the web page has a redirection. If the web page needs the usage of the https protocol to be accessed you can call it as: 'https://www.test.com', this is not mandatory since the scraper checks if the protocol is needed.\n\nGet iframe:\n~~~~~~~~~~~\n\n.. code:: python\n\n result = test.get_scraped_data('https://www.youtube.com/watch?v=dQw4w9WgXcQ')\n \noutput:\n~~~~~~~\n\n.. code:: javascript\n\n {\n description: 'Rick Astley - Never Gonna Give You Up (Official Music Video) - Listen On Spotify: http://smarturl.it/AstleySpotify Download Rick\\'s Number 1 album \"50\" - http...', \n title: 'Rick Astley - Never Gonna Give You Up', \n url: 'https://www.youtube.com/watch?v=dQw4w9WgXcQ', \n image: 'https://i.ytimg.com/vi/dQw4w9WgXcQ/maxresdefault.jpg', \n source: 'www.youtube.com', \n iframe: ''\n }\nThis is on `GitHub `__ so let me\nknow if I've broked it somewhere.\n\nStuff used to make this:\n~~~~~~~~~~~~~~~~~~~~~~~~\n\n- `beautifulsoup4 `__\n for Markdown language parsing\n- `html5lib `__ for the\n awesome html5 parser", "description_content_type": null, "docs_url": null, "download_url": "UNKNOWN", "downloads": { "last_day": -1, "last_month": -1, "last_week": -1 }, "home_page": "https://github.com/ROZ32/pythonScraper", "keywords": null, "license": "MIT License", "maintainer": null, "maintainer_email": null, "name": "simplescraper", "package_url": "https://pypi.org/project/simplescraper/", "platform": "any", "project_url": "https://pypi.org/project/simplescraper/", "project_urls": { "Download": "UNKNOWN", "Homepage": "https://github.com/ROZ32/pythonScraper" }, "release_url": "https://pypi.org/project/simplescraper/0.1.3/", "requires_dist": null, "requires_python": null, "summary": "A simple python web scraper", "version": "0.1.3" }, "last_serial": 2818315, "releases": { "0.1": [], "0.1.1": [ { "comment_text": "", "digests": { "md5": "25251db30a33990df3b8626ea2b6fcc0", "sha256": "4941c2436dece4fae3c57a3249b06599e4f67f1d75e11703a58626e53e5da254" }, "downloads": -1, "filename": "simplescraper-0.1.1-py2-none-any.whl", "has_sig": false, "md5_digest": "25251db30a33990df3b8626ea2b6fcc0", "packagetype": "bdist_wheel", "python_version": "py2", "requires_python": null, "size": 2757, "upload_time": "2017-04-14T01:05:33", "url": "https://files.pythonhosted.org/packages/8a/1f/f146dc6bd6bd8e676c8b3c28d9e997934467629695759e9400bfebc9f012/simplescraper-0.1.1-py2-none-any.whl" }, { "comment_text": "", "digests": { "md5": "61e50cb37f8280df2529c5a9e7e3fee1", "sha256": "f309f021b5c8b26f95b0a42855e3f4faa9dc69efa769dd6ddb1e9ff49261cf3c" }, "downloads": -1, "filename": "simplescraper-0.1.1.tar.gz", "has_sig": false, "md5_digest": "61e50cb37f8280df2529c5a9e7e3fee1", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 2331, "upload_time": "2017-04-14T00:55:07", "url": "https://files.pythonhosted.org/packages/97/bc/2438ea33f443d29bf94fe025108694b834e0ab9d2e82ea503f1a3bd9455b/simplescraper-0.1.1.tar.gz" } ], "0.1.2": [ { "comment_text": "", "digests": { "md5": "d3c6594a5652421a896650599336f8ab", "sha256": "29c93e44bdd0641cf9053209c25f9761410786c46563ca3983c3ae4f47947e77" }, "downloads": -1, "filename": "simplescraper-0.1.2-py2-none-any.whl", "has_sig": false, "md5_digest": "d3c6594a5652421a896650599336f8ab", "packagetype": "bdist_wheel", "python_version": "py2", "requires_python": null, "size": 5401, "upload_time": "2017-04-14T04:31:52", "url": "https://files.pythonhosted.org/packages/73/0d/71a81a1d7c785b8cff58e26bdac3743b149c1188a69dcb57375fe4984908/simplescraper-0.1.2-py2-none-any.whl" }, { "comment_text": "", "digests": { "md5": "b47016b9c82a646d22e3baef28299557", "sha256": "a4bc66674a2c02fdfe4e148115f93662880b8902bf9d4053f909364c607df15c" }, "downloads": -1, "filename": "simplescraper-0.1.2.tar.gz", "has_sig": false, "md5_digest": "b47016b9c82a646d22e3baef28299557", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 4513, "upload_time": "2017-04-14T04:31:53", "url": "https://files.pythonhosted.org/packages/fb/c6/a1bc678fdd123c07ade1fee3131e2e45c2a8df97bc98d95ae127f1672a5e/simplescraper-0.1.2.tar.gz" } ], "0.1.3": [ { "comment_text": "", "digests": { "md5": "d981f5b00ad259ef8d1138f809154b31", "sha256": "eaa1e4cae29aeddd2bb8a5a906c9e2922908bd44a5dd61451a2c4a69b57a1665" }, "downloads": -1, "filename": "simplescraper-0.1.3-py2-none-any.whl", "has_sig": false, "md5_digest": "d981f5b00ad259ef8d1138f809154b31", "packagetype": "bdist_wheel", "python_version": "py2", "requires_python": null, "size": 6720, "upload_time": "2017-04-20T19:17:20", "url": "https://files.pythonhosted.org/packages/1f/47/5705e0894bd78e4de58d421b4e7865a74349f636e95ef23ec028ba462998/simplescraper-0.1.3-py2-none-any.whl" }, { "comment_text": "", "digests": { "md5": "73e398979eefb38071ad12d295d6d090", "sha256": "ffc5ea8dfac2ea40a90555a2b47a4b7695662db586990791554a3f02958a2598" }, "downloads": -1, "filename": "simplescraper-0.1.3.tar.gz", "has_sig": false, "md5_digest": "73e398979eefb38071ad12d295d6d090", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 5375, "upload_time": "2017-04-20T19:17:22", "url": "https://files.pythonhosted.org/packages/88/23/c795b24c0359481a305f0c758248242c3ac7a193101fa87e3e44b111525a/simplescraper-0.1.3.tar.gz" } ] }, "urls": [ { "comment_text": "", "digests": { "md5": "d981f5b00ad259ef8d1138f809154b31", "sha256": "eaa1e4cae29aeddd2bb8a5a906c9e2922908bd44a5dd61451a2c4a69b57a1665" }, "downloads": -1, "filename": "simplescraper-0.1.3-py2-none-any.whl", "has_sig": false, "md5_digest": "d981f5b00ad259ef8d1138f809154b31", "packagetype": "bdist_wheel", "python_version": "py2", "requires_python": null, "size": 6720, "upload_time": "2017-04-20T19:17:20", "url": "https://files.pythonhosted.org/packages/1f/47/5705e0894bd78e4de58d421b4e7865a74349f636e95ef23ec028ba462998/simplescraper-0.1.3-py2-none-any.whl" }, { "comment_text": "", "digests": { "md5": "73e398979eefb38071ad12d295d6d090", "sha256": "ffc5ea8dfac2ea40a90555a2b47a4b7695662db586990791554a3f02958a2598" }, "downloads": -1, "filename": "simplescraper-0.1.3.tar.gz", "has_sig": false, "md5_digest": "73e398979eefb38071ad12d295d6d090", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 5375, "upload_time": "2017-04-20T19:17:22", "url": "https://files.pythonhosted.org/packages/88/23/c795b24c0359481a305f0c758248242c3ac7a193101fa87e3e44b111525a/simplescraper-0.1.3.tar.gz" } ] }