{ "info": { "author": "Graham Poulter", "author_email": "", "bugtrack_url": null, "classifiers": [ "Development Status :: 5 - Production/Stable", "Intended Audience :: Developers", "License :: OSI Approved :: GNU Lesser General Public License v3 (LGPLv3)", "License :: OSI Approved :: GNU Lesser General Public License v3 or later (LGPLv3+)", "License :: OSI Approved :: GNU Library or Lesser General Public License (LGPL)", "Natural Language :: English", "Operating System :: OS Independent", "Programming Language :: Python", "Programming Language :: Python :: 2", "Programming Language :: Python :: 2.6", "Programming Language :: Python :: 2.7", "Programming Language :: Python :: 3", "Programming Language :: Python :: 3.2", "Topic :: Text Processing", "Topic :: Text Processing :: Indexing", "Topic :: Text Processing :: Linguistic" ], "description": "The NGram class extends the Python 'set' class with efficient\nfuzzy search for members by means of an N-gram similarity measure.\nIt also has static methods to compare a pair of strings.\n\nThe N-grams are character based not word-based, and the class does not\nimplement a language model, merely searching for members by string similarity.\n\nThe `documentation`_, `tutorial`_ and `release notes`_ are on the\nPyPI package documentation site. Please use the `GitHub issue tracker`_\nto report issues.\n\nInstallation\n============\n\nInstall python-ngram from `PyPI`_ using `pip installer`_::\n\n pip install ngram\n\nIt should run on Python 2.6, Python 2.7 and Python 3.2\n\nHow does it work?\n=================\n\nThe set stores arbitrary items, but for non-string items a `key` function\n(such as `str`) must be specified to provide a string represenation. The key\nfunction can also be used to normalise string items (e.g. lower-casing) prior\nto N-gram indexing.\n\nTo index a string it pads the string with a specified dummy character, then\nsplits it into overlapping substrings of N (default N=3) characters in length\nand associates each N-gram to the items that use it.\n\nTo find items similar to a query string, it splits the query into N-grams,\ncollects all items sharing at least one N-gram with the query,\nand ranks the items by score based on the ratio of shared to unshared\nN-grams between strings.\n\nHistory\n=======\n\nIn 2007, Michel Albert (exhuma) wrote the python-ngram module based on Perl's\n`String::Trigram`_ module by Tarek Ahmed, and committed the code for 2.0.0b2 to\na now-disused `Sourceforge`_ subversion repo.\n\nSince late 2008, Graham Poulter has maintained python-ngram, initially refactoring\nit to build on the `set` class, and also adding features, documentation, tests,\nperformance improvements and Python 3 support.\n\nPrimary development takes place on `GitHub`_, but changes are also pushed\nto the earlier repo on `Google Code`_.\n\n.. _documentation: http://packages.python.org/ngram/\n.. _tutorial: http://packages.python.org/ngram/tutorial.html\n.. _release notes: http://packages.python.org/ngram/releasenotes.html\n.. _GitHub issue tracker: https://github.com/gpoulter/python-ngram/issues\n.. _PyPI: http://pypi.python.org/pypi/ngram\n.. _pip installer: http://www.pip-installer.org\n.. _String::Trigram: http://search.cpan.org/dist/String-Trigram/\n.. _Sourceforge: https://sourceforge.net/projects/python-ngram/\n.. _GitHub: http://github.com/gpoulter/python-ngram\n.. _Google Code: http://code.google.com/p/python-ngram/\n", "description_content_type": null, "docs_url": "https://pythonhosted.org/ngram/", "download_url": "http://pypi.python.org/pypi/ngram", "downloads": { "last_day": -1, "last_month": -1, "last_week": -1 }, "home_page": "http://github.com/gpoulter/python-ngram", "keywords": "ngram set string text similarity", "license": "LGPLv3+", "maintainer": "", "maintainer_email": "", "name": "ngram", "package_url": "https://pypi.org/project/ngram/", "platform": "any", "project_url": "https://pypi.org/project/ngram/", "project_urls": { "Download": "http://pypi.python.org/pypi/ngram", "Homepage": "http://github.com/gpoulter/python-ngram" }, "release_url": "https://pypi.org/project/ngram/3.3.2/", "requires_dist": null, "requires_python": "", "summary": "A `set` subclass providing fuzzy search based on N-grams.", "version": "3.3.2" }, "last_serial": 2963183, "releases": { "2.0.0b2": [ { "comment_text": "", "digests": { "md5": "d18014c094b66a67dcccc9ef018cb67b", "sha256": "0feb2f59982e92e715f61ff8ac34216827229bacc3065b34d2bde930c0200bd9" }, "downloads": -1, "filename": "ngram-2.0.0b2.tar.gz", "has_sig": false, "md5_digest": "d18014c094b66a67dcccc9ef018cb67b", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 13565, "upload_time": "2007-10-23T13:13:23", "url": "https://files.pythonhosted.org/packages/0c/96/d6724f54b9064696923cd526258c72c6bf163d5c950592a9d4ec392b489f/ngram-2.0.0b2.tar.gz" } ], "3.0": [ { "comment_text": "", "digests": { "md5": "784450fe017baf00cbde9503d490bdd3", "sha256": "16672a1882878457f751889ac3f98b9ae0fd22ffa147bf7ba872f5ba319852b2" }, "downloads": -1, "filename": "ngram-3.0-py2.5.egg", "has_sig": false, "md5_digest": "784450fe017baf00cbde9503d490bdd3", "packagetype": "bdist_egg", "python_version": "2.5", "requires_python": null, "size": 10603, "upload_time": "2009-07-03T16:38:43", "url": "https://files.pythonhosted.org/packages/4e/c7/476a767832acb7a2f99d0b562e78f276b777ee206efc86f065df01fadc69/ngram-3.0-py2.5.egg" }, { "comment_text": "", "digests": { "md5": "26c1c03a4d09049d924c7a5a67bfeeb2", "sha256": "ec24118ce5f4b730d5f91e8f410975bbacfd586e18709d47aa8cd571238dbd88" }, "downloads": -1, "filename": "ngram-3.0-py2.6.egg", "has_sig": false, "md5_digest": "26c1c03a4d09049d924c7a5a67bfeeb2", "packagetype": "bdist_egg", "python_version": "2.6", "requires_python": null, "size": 10598, "upload_time": "2009-07-03T16:52:47", "url": "https://files.pythonhosted.org/packages/21/0e/0ebcaa38def41fdb9949bc5689e191444bbf7ba4f3033bf8e0c9ea373d3a/ngram-3.0-py2.6.egg" }, { "comment_text": "", "digests": { "md5": "2af73f0a1152570b78ec77fd19b1ad9b", "sha256": "720c87632035080796b635e3eddea8aa2ccce54f6a6aa594847f6464aff966b1" }, "downloads": -1, "filename": "ngram-3.0.tar.gz", "has_sig": false, "md5_digest": "2af73f0a1152570b78ec77fd19b1ad9b", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 19136, "upload_time": "2009-07-03T16:38:59", "url": "https://files.pythonhosted.org/packages/a5/73/fff9959d4cb87c05b3647fc724e2fc23350da80acb1674eff2ff15f23c23/ngram-3.0.tar.gz" } ], "3.1": [ { "comment_text": "", "digests": { "md5": "12efe775ac4ce5e7542bcfc90767a937", "sha256": "5a5461de9654b4b2b9b0743725e2b29a563d18a1457c33812a59648e52c59106" }, "downloads": -1, "filename": "ngram-3.1-py2.6.egg", "has_sig": false, "md5_digest": "12efe775ac4ce5e7542bcfc90767a937", "packagetype": "bdist_egg", "python_version": "2.6", "requires_python": null, "size": 10959, "upload_time": "2009-12-07T13:08:30", "url": "https://files.pythonhosted.org/packages/eb/7e/4e9e3a3cd22c1ee35fd252a5f4ecbaa218b7d33bc0b09908cbafc5f5d6d7/ngram-3.1-py2.6.egg" }, { "comment_text": "", "digests": { "md5": "3b048dae3484ace03d29fc306245eba2", "sha256": "5c76a3721944fc37559cd36b06d2f81699b760752f7dd32a8017e47bb9bd6afe" }, "downloads": -1, "filename": "ngram-3.1-py3.1.egg", "has_sig": false, "md5_digest": "3b048dae3484ace03d29fc306245eba2", "packagetype": "bdist_egg", "python_version": "3.1", "requires_python": null, "size": 9865, "upload_time": "2009-12-07T13:08:44", "url": "https://files.pythonhosted.org/packages/7d/09/b160d19250549b45815c07ce48614d17f82ce8eff76311489b7d28e2fd9f/ngram-3.1-py3.1.egg" }, { "comment_text": "", "digests": { "md5": "a951c3ef2ede6dbcdd4d4b561e45c93d", "sha256": "12146c9872b9622381546ea15708208c079805fac06187551567e3e577b97f8c" }, "downloads": -1, "filename": "ngram-3.1.tar.gz", "has_sig": false, "md5_digest": "a951c3ef2ede6dbcdd4d4b561e45c93d", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 25326, "upload_time": "2009-12-07T13:08:30", "url": "https://files.pythonhosted.org/packages/06/e7/630caee9547f75e8b68ea510b4509372e49e2d54f341f7347df5a9af9333/ngram-3.1.tar.gz" }, { "comment_text": "", "digests": { "md5": "32ae2015664c5f5ee286e10df1264fc6", "sha256": "215d12e6f260eaadf11463393ceedbbc32e703c98b6a55ba95dbe19cdb475dd4" }, "downloads": -1, "filename": "ngram-3.1.win32-py2.6.exe", "has_sig": false, "md5_digest": "32ae2015664c5f5ee286e10df1264fc6", "packagetype": "bdist_wininst", "python_version": "2.6", "requires_python": null, "size": 202372, "upload_time": "2009-12-07T13:23:01", "url": "https://files.pythonhosted.org/packages/de/1c/5a70a86fe8b61a94cf4f0cd50f4659e75da3992bda6bf1b21fce89e23711/ngram-3.1.win32-py2.6.exe" } ], "3.2": [ { "comment_text": "", "digests": { "md5": "bcc2e195d547bbc9cff15113024819a6", "sha256": "968783ead6efca1b469f32defe51eaaeea65ffaaefe32d9809c0b77d9d23e9d2" }, "downloads": -1, "filename": "ngram-3.2.tar.gz", "has_sig": false, "md5_digest": "bcc2e195d547bbc9cff15113024819a6", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 8226, "upload_time": "2012-06-25T17:18:16", "url": "https://files.pythonhosted.org/packages/0f/d9/f9539b46a3e625577f78928ff5eaaefc81bf3512e8b5c3417ceaabb844f3/ngram-3.2.tar.gz" } ], "3.2.1": [ { "comment_text": "", "digests": { "md5": "0bad573163b51cbbda068513c35fe7fb", "sha256": "cdaedeb789b325b6d5c8113fa47172d9e931a7245ff89d1faa7a5d2527bb0633" }, "downloads": -1, "filename": "ngram-3.2.1.tar.gz", "has_sig": false, "md5_digest": "0bad573163b51cbbda068513c35fe7fb", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 8019, "upload_time": "2012-06-28T16:44:33", "url": "https://files.pythonhosted.org/packages/e2/d0/4973894f58866e7be44f19c484a32317f3680b940324d99b1e4bdbd9efb6/ngram-3.2.1.tar.gz" } ], "3.3.0": [ { "comment_text": "", "digests": { "md5": "7874f4b7daba5680e9dadda889ebf007", "sha256": "ea848fa3dfabbd5a1afdee4fe1871337c6c6a7225cac9ec5f2de8223ac2223db" }, "downloads": -1, "filename": "ngram-3.3.0.tar.gz", "has_sig": false, "md5_digest": "7874f4b7daba5680e9dadda889ebf007", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 8847, "upload_time": "2012-06-29T16:07:07", "url": "https://files.pythonhosted.org/packages/78/ff/4a7a88047fe50ab9806446488730ab3f74fc277be2357ac46f6f0c9b0227/ngram-3.3.0.tar.gz" } ], "3.3.2": [ { "comment_text": "", "digests": { "md5": "6e4c95cfb01636e6fb6c368d926327cb", "sha256": "f6f7f5e1126f3f72a5a2f854e1defebf55082448a6532d04fba522da811f44f8" }, "downloads": -1, "filename": "ngram-3.3.2.tar.gz", "has_sig": false, "md5_digest": "6e4c95cfb01636e6fb6c368d926327cb", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 31644, "upload_time": "2017-06-20T20:44:19", "url": "https://files.pythonhosted.org/packages/3b/84/707fdecbe63e67345db200a86274686d58fd3da805da53c80c5942d90393/ngram-3.3.2.tar.gz" } ] }, "urls": [ { "comment_text": "", "digests": { "md5": "6e4c95cfb01636e6fb6c368d926327cb", "sha256": "f6f7f5e1126f3f72a5a2f854e1defebf55082448a6532d04fba522da811f44f8" }, "downloads": -1, "filename": "ngram-3.3.2.tar.gz", "has_sig": false, "md5_digest": "6e4c95cfb01636e6fb6c368d926327cb", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 31644, "upload_time": "2017-06-20T20:44:19", "url": "https://files.pythonhosted.org/packages/3b/84/707fdecbe63e67345db200a86274686d58fd3da805da53c80c5942d90393/ngram-3.3.2.tar.gz" } ] }