{ "info": { "author": "digitalarbeiter", "author_email": "digitalarbeiter@talbriefkasten.de", "bugtrack_url": null, "classifiers": [], "description": "# Probabilistic Spell Checker in Python\n\nSpell checker based on edit distance (Levenshtein-ish) and word frequency\nin a training corpus.\n\n For theoretical background, see Peter Norvig's article,\nhttps://norvig.com/spell-correct.html\n\nComes with a dictionary trained from German Wikipedia articles.\n\nUsage:\n\n import json\n import re\n import probspellchecker\n\n spellchecker = probspellchecker.ProbabilisticSpellChecker(\n word_counts=json.load(open(\"dictionary_dewiki_full10plus.json\")),\n word_whitelist=[\"my\", \"custom\", \"wordlist\"],\n )\n\n text = \"lorem ipsum whatever\"\n for word in re.findall(r\"\\w+\", text):\n correction = spellchecker.correction(word.lower())\n if correction:\n print(correction)\n else:\n print(word)\n\nWord counts is just that, a dict with word to count mapping. To build your\nown dictionaries, see probdict-from-dewiki.py and probdict-from-text.py.\nYou may also specify a whitelist of words that should just be accepted by\nthe spell checker, which is useful if your name is not in the dictionary.\n\nIf your language sports special characters like the German umlauts, you\nmight need to pass an additional charset parameter which is a string with\nall allowed characters of your language, to the ProbabilisticSpellChecker.\nThis is then used to generate candidate words.\n\n## Logging\n\nIf the logging annoys you, just shut it up:\n\n spell_log = logging.getLogger(\"probspellchecker\")\n spell_log.setLevel(logging.ERROR) # log only errors\n\n\n\n", "description_content_type": "text/markdown", "docs_url": null, "download_url": "", "downloads": { "last_day": -1, "last_month": -1, "last_week": -1 }, "home_page": "https://github.com/digitalarbeiter/probspellchecker", "keywords": "", "license": "LGPLv3", "maintainer": "", "maintainer_email": "", "name": "probspellchecker", "package_url": "https://pypi.org/project/probspellchecker/", "platform": "", "project_url": "https://pypi.org/project/probspellchecker/", "project_urls": { "Homepage": "https://github.com/digitalarbeiter/probspellchecker" }, "release_url": "https://pypi.org/project/probspellchecker/0.1.3/", "requires_dist": null, "requires_python": "", "summary": "probabilistic spell checker", "version": "0.1.3" }, "last_serial": 4235533, "releases": { "0.1.1": [ { "comment_text": "", "digests": { "md5": "e32599fca4cb1a705efe7a7981f87428", "sha256": "044b9c61560bac49412e6630ca1050ab0b660a3a4362dca29f9e329cd8108445" }, "downloads": -1, "filename": "probspellchecker-0.1.1-py3-none-any.whl", "has_sig": false, "md5_digest": "e32599fca4cb1a705efe7a7981f87428", "packagetype": "bdist_wheel", "python_version": "py3", "requires_python": null, "size": 5428, "upload_time": "2018-09-03T13:51:19", "url": "https://files.pythonhosted.org/packages/25/b3/212142966557e37abec211ba2663a2b4ff59a0770709f246592e486375eb/probspellchecker-0.1.1-py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "5511f711e60de7c6d9d914a0edafa0cc", "sha256": "e2d04aa06a312d2c69261db1885ae5ff65d1c87b8f632d36d15752f1811d0b04" }, "downloads": -1, "filename": "probspellchecker-0.1.1.tar.gz", "has_sig": false, "md5_digest": "5511f711e60de7c6d9d914a0edafa0cc", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 4266, "upload_time": "2018-09-03T13:51:20", "url": "https://files.pythonhosted.org/packages/ad/3d/c19ead6fa4b5fdf91e3ff27092abca088995afd11b7c7b8dc6d69a1c407f/probspellchecker-0.1.1.tar.gz" } ], "0.1.2": [ { "comment_text": "", "digests": { "md5": "9967571000ef3ec5503dbfb1bdce9c24", "sha256": "5cef450278961daa926d3ff861110bd70367ea1ee763bd2597942ebf94428dc8" }, "downloads": -1, "filename": "probspellchecker-0.1.2-py3-none-any.whl", "has_sig": false, "md5_digest": "9967571000ef3ec5503dbfb1bdce9c24", "packagetype": "bdist_wheel", "python_version": "py3", "requires_python": null, "size": 5415, "upload_time": "2018-09-03T20:09:16", "url": "https://files.pythonhosted.org/packages/b1/3d/919c146be25abbcdf886e2f40acd5104e306ebc651c1b9f60eded3eecf21/probspellchecker-0.1.2-py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "dc0872cdc184b97d238ec93769c2e261", "sha256": "7125bd2d60e0d2234efec56fa9004033cc65e83d19c598ef24640d07ae67015a" }, "downloads": -1, "filename": "probspellchecker-0.1.2.tar.gz", "has_sig": false, "md5_digest": "dc0872cdc184b97d238ec93769c2e261", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 4213, "upload_time": "2018-09-03T20:09:17", "url": "https://files.pythonhosted.org/packages/18/e9/82306c89a3d2717ec2a3b2d2529aabe269bc5434f0c77f235b7055e6ef80/probspellchecker-0.1.2.tar.gz" } ], "0.1.3": [ { "comment_text": "", "digests": { "md5": "14da1f3ec3af194ffe771640172d25ea", "sha256": "f497da79cb39d72af0ffdf97065c94425acc356a9442d917f90bb8eed0899029" }, "downloads": -1, "filename": "probspellchecker-0.1.3-py3-none-any.whl", "has_sig": false, "md5_digest": "14da1f3ec3af194ffe771640172d25ea", "packagetype": "bdist_wheel", "python_version": "py3", "requires_python": null, "size": 5415, "upload_time": "2018-09-03T20:51:15", "url": "https://files.pythonhosted.org/packages/46/37/d33a6ad59535a6dece54bc309cd565706b4824d0b28d5a5d5ba2754ab065/probspellchecker-0.1.3-py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "9dba22856f02b9261e66a44860c973a1", "sha256": "735c1f46a8457fa9b28eebd878991d6189517ecc05848e833dd8240f160ea9bf" }, "downloads": -1, "filename": "probspellchecker-0.1.3.tar.gz", "has_sig": false, "md5_digest": "9dba22856f02b9261e66a44860c973a1", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 4218, "upload_time": "2018-09-03T20:51:16", "url": "https://files.pythonhosted.org/packages/a3/d1/8230e6ee19220a074266fe59db4b1755739e7830c8973fe592e7366d281d/probspellchecker-0.1.3.tar.gz" } ] }, "urls": [ { "comment_text": "", "digests": { "md5": "14da1f3ec3af194ffe771640172d25ea", "sha256": "f497da79cb39d72af0ffdf97065c94425acc356a9442d917f90bb8eed0899029" }, "downloads": -1, "filename": "probspellchecker-0.1.3-py3-none-any.whl", "has_sig": false, "md5_digest": "14da1f3ec3af194ffe771640172d25ea", "packagetype": "bdist_wheel", "python_version": "py3", "requires_python": null, "size": 5415, "upload_time": "2018-09-03T20:51:15", "url": "https://files.pythonhosted.org/packages/46/37/d33a6ad59535a6dece54bc309cd565706b4824d0b28d5a5d5ba2754ab065/probspellchecker-0.1.3-py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "9dba22856f02b9261e66a44860c973a1", "sha256": "735c1f46a8457fa9b28eebd878991d6189517ecc05848e833dd8240f160ea9bf" }, "downloads": -1, "filename": "probspellchecker-0.1.3.tar.gz", "has_sig": false, "md5_digest": "9dba22856f02b9261e66a44860c973a1", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 4218, "upload_time": "2018-09-03T20:51:16", "url": "https://files.pythonhosted.org/packages/a3/d1/8230e6ee19220a074266fe59db4b1755739e7830c8973fe592e7366d281d/probspellchecker-0.1.3.tar.gz" } ] }