{ "info": { "author": "Christian Peccei", "author_email": "cpeccei@hotmail.com", "bugtrack_url": null, "classifiers": [ "Development Status :: 5 - Production/Stable", "Intended Audience :: Developers", "Intended Audience :: Science/Research", "License :: OSI Approved :: GNU General Public License (GPL)", "Natural Language :: English", "Operating System :: OS Independent", "Programming Language :: Python", "Topic :: Scientific/Engineering :: Artificial Intelligence", "Topic :: Scientific/Engineering :: Information Analysis", "Topic :: Text Processing :: General", "Topic :: Text Processing :: Linguistic" ], "description": "This package contains a variety of useful functions for text mining in Python.\r\nIt focuses on statistical text mining (i.e. the bag-of-words model) and makes it\r\nvery easy to create a term-document matrix from a collection of documents. This\r\nmatrix can then be read into a statistical package (R, MATLAB, etc.) for further\r\nanalysis. The package also provides some useful utilities for finding\r\ncollocations (i.e. significant two-word phrases), computing the edit distance\r\nbetween words, and chunking long documents up into smaller pieces.\r\n\r\nThe package has a large amount of curated data (stopwords, common names, an\r\nEnglish dictionary with parts of speech and word frequencies) which allows the\r\nuser to extract fairly sophisticated features from a document.\r\n\r\nThis package does NOT have any natural language processing capabilities such as\r\npart-of-speech tagging. Please see the Python NLTK for that sort of\r\nfunctionality (plus much, much more).", "description_content_type": null, "docs_url": null, "download_url": "UNKNOWN", "downloads": { "last_day": -1, "last_month": -1, "last_week": -1 }, "home_page": "http://www.christianpeccei.com/textmining", "keywords": "", "license": "UNKNOWN", "maintainer": "", "maintainer_email": "", "name": "textmining", "package_url": "https://pypi.org/project/textmining/", "platform": "UNKNOWN", "project_url": "https://pypi.org/project/textmining/", "project_urls": { "Download": "UNKNOWN", "Homepage": "http://www.christianpeccei.com/textmining" }, "release_url": "https://pypi.org/project/textmining/1.0/", "requires_dist": null, "requires_python": null, "summary": "Python Text Mining Utilities", "version": "1.0" }, "last_serial": 1337712, "releases": { "1.0": [ { "comment_text": "", "digests": { "md5": "606edecbdc88fdea701a4e4c494a4ff3", "sha256": "846bda6402a0d399a039885ad8f02da7ddd49c785a7a9d7c13417ffc3ae58086" }, "downloads": -1, "filename": "textmining-1.0.zip", "has_sig": false, "md5_digest": "606edecbdc88fdea701a4e4c494a4ff3", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 1856371, "upload_time": "2010-11-01T22:06:49", "url": "https://files.pythonhosted.org/packages/f7/ca/3fb84b7fc0f5e51c4f8d4e6ba5bb5cc833410700bcec22594eefe072febe/textmining-1.0.zip" } ] }, "urls": [ { "comment_text": "", "digests": { "md5": "606edecbdc88fdea701a4e4c494a4ff3", "sha256": "846bda6402a0d399a039885ad8f02da7ddd49c785a7a9d7c13417ffc3ae58086" }, "downloads": -1, "filename": "textmining-1.0.zip", "has_sig": false, "md5_digest": "606edecbdc88fdea701a4e4c494a4ff3", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 1856371, "upload_time": "2010-11-01T22:06:49", "url": "https://files.pythonhosted.org/packages/f7/ca/3fb84b7fc0f5e51c4f8d4e6ba5bb5cc833410700bcec22594eefe072febe/textmining-1.0.zip" } ] }