{ "info": { "author": "Dwayne V Campbell", "author_email": "dwaynecampbell13 _at_ gmail.com", "bugtrack_url": null, "classifiers": [ "Development Status :: 4 - Beta", "Intended Audience :: Developers", "License :: OSI Approved :: MIT License", "Topic :: Scientific/Engineering", "Topic :: Software Development :: Libraries :: Python Modules", "Topic :: Text Processing", "Topic :: Text Processing :: General", "Topic :: Utilities" ], "description": "News Corpus Builder\r\n\r\nA simple module that can be used to quickly build a corpus from news articles. The generated corpus can be stored in a sqlite database or as flat files.\r\n\r\nSee http://skillachie.github.io/news-corpus-builder/ for installation and usage", "description_content_type": null, "docs_url": null, "download_url": "https://github.com/skillachie/news_corpus_builder", "downloads": { "last_day": -1, "last_month": -1, "last_week": -1 }, "home_page": "http://skillachie.github.io/news-corpus-builder/", "keywords": "corpus, nlp news,extractor,web scraping, natural language processing", "license": "MIT License", "maintainer": "", "maintainer_email": "", "name": "news-corpus-builder", "package_url": "https://pypi.org/project/news-corpus-builder/", "platform": "UNKNOWN", "project_url": "https://pypi.org/project/news-corpus-builder/", "project_urls": { "Download": "https://github.com/skillachie/news_corpus_builder", "Homepage": "http://skillachie.github.io/news-corpus-builder/" }, "release_url": "https://pypi.org/project/news-corpus-builder/0.1.4/", "requires_dist": null, "requires_python": null, "summary": "Quickly build a news/web corpus with specific topics or terms automatically from Google News or by specifying article links in a file. \nThis module automatically extracts the body and title from each article and saves the result to either flatfiles or sqlite database.", "version": "0.1.4" }, "last_serial": 1749902, "releases": { "0.1.1": [ { "comment_text": "", "digests": { "md5": "6f0fc69fc32aa36003559a1950ef747b", "sha256": "cd63f09c7f63c9f8209541cfdfb18c909f61e6b74dc87265d879bcb47cb38241" }, "downloads": -1, "filename": "news-corpus-builder-0.1.2.zip", "has_sig": false, "md5_digest": "6f0fc69fc32aa36003559a1950ef747b", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 6067, "upload_time": "2015-09-05T04:04:27", "url": "https://files.pythonhosted.org/packages/0c/24/5a8b121b35d0c64f9e9611744b570d59583b1258f8cda1a9a13b0b946194/news-corpus-builder-0.1.2.zip" } ], "0.1.2": [ { "comment_text": "", "digests": { "md5": "9a9490f1acdd9b650d1ca9a81f7343ec", "sha256": "3b28f9b01e3d401e088890f1eda59e7a377a912c0e6af9669267cc5833ad35fb" }, "downloads": -1, "filename": "news-corpus-builder-0.1.4.zip", "has_sig": false, "md5_digest": "9a9490f1acdd9b650d1ca9a81f7343ec", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 6158, "upload_time": "2015-10-03T02:45:15", "url": "https://files.pythonhosted.org/packages/63/bb/8678fa71a5f2fb02691771d1803477eeda82f56ad877705cb8b622bf2965/news-corpus-builder-0.1.4.zip" } ], "0.1.4": [ { "comment_text": "", "digests": { "md5": "c620a67dbc812d6fa403b3ed27c1fd90", "sha256": "1494f5e793f4bd1d7f04b869463167c2db0f09b98061c386708bd0f78b687895" }, "downloads": -1, "filename": "news-corpus-builder-0.1.5.zip", "has_sig": false, "md5_digest": "c620a67dbc812d6fa403b3ed27c1fd90", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 6158, "upload_time": "2015-10-03T02:50:28", "url": "https://files.pythonhosted.org/packages/5d/e1/43b98c242ce342d30fd574751513dbb6f75137503893e30813abec278ae5/news-corpus-builder-0.1.5.zip" } ] }, "urls": [ { "comment_text": "", "digests": { "md5": 
"c620a67dbc812d6fa403b3ed27c1fd90", "sha256": "1494f5e793f4bd1d7f04b869463167c2db0f09b98061c386708bd0f78b687895" }, "downloads": -1, "filename": "news-corpus-builder-0.1.5.zip", "has_sig": false, "md5_digest": "c620a67dbc812d6fa403b3ed27c1fd90", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 6158, "upload_time": "2015-10-03T02:50:28", "url": "https://files.pythonhosted.org/packages/5d/e1/43b98c242ce342d30fd574751513dbb6f75137503893e30813abec278ae5/news-corpus-builder-0.1.5.zip" } ] }