{ "info": { "author": "Erick Fonseca", "author_email": "erickrfonseca@gmail.com", "bugtrack_url": null, "classifiers": [ "Development Status :: 5 - Production/Stable", "Intended Audience :: Developers", "Intended Audience :: Science/Research", "License :: OSI Approved :: MIT License", "Programming Language :: Python :: 2.7", "Programming Language :: Python :: 3", "Topic :: Software Development :: Build Tools" ], "description": "Unitex Lemmatizer\n=================\n\nThis is a simple module for lemmatization based on the Unitex inflected word\nlist. As such, it needs a Unitex vocabulary file in order to work properly.\n\nSo far, I've only worked with Portuguese, with the\n`DELAF_PB file `_\nprovided by NILC.\n\nInstalling\n----------\n\nYou can either clone the repository and install with\n\n.. code-block:: bash\n\n $ python setup.py install\n\nor install through pip\n\n.. code-block:: bash\n\n $ pip install unitexlemmatizer\n\nUsage\n-----\n\nIn order to use the Unitex Lemmatizer, you need to tell it where the word list\nis:\n\n.. code-block:: python\n\n >>> import unitexlemmatizer as ul\n >>> ul.load_unitex_dictionary('/path/to/delaf.dic')\n\nThen, you can call the ``get_lemma`` function passing the inflected word and its\npart of speech tag (from the `Universal Dependencies `_\ntagset).\n\n.. code-block:: python\n\n >>> ul.get_lemma('corpora', 'noun')\n 'corpus'", "description_content_type": null, "docs_url": null, "download_url": null, "downloads": { "last_day": -1, "last_month": -1, "last_week": -1 }, "home_page": "https://github.com/erickrf/unitex-lemmatizer", "keywords": "nlp,lemmatizer", "license": "MIT", "maintainer": null, "maintainer_email": null, "name": "unitexlemmatizer", "package_url": "https://pypi.org/project/unitexlemmatizer/", "platform": "UNKNOWN", "project_url": "https://pypi.org/project/unitexlemmatizer/", "project_urls": { "Homepage": "https://github.com/erickrf/unitex-lemmatizer" }, "release_url": "https://pypi.org/project/unitexlemmatizer/1.0.0/", "requires_dist": null, "requires_python": null, "summary": "A simple lemmatizer based on Unitex word lists", "version": "1.0.0" }, "last_serial": 2585506, "releases": { "1.0.0": [ { "comment_text": "", "digests": { "md5": "4811bf793feb638b997305efa3654171", "sha256": "5a7a4699e10a1b37efaac2e9404e8766c0e664c907bc1a89fcd37910756dac08" }, "downloads": -1, "filename": "unitexlemmatizer-1.0.0-py2.7.egg", "has_sig": false, "md5_digest": "4811bf793feb638b997305efa3654171", "packagetype": "bdist_egg", "python_version": "2.7", "requires_python": null, "size": 5083, "upload_time": "2017-01-19T16:48:14", "url": "https://files.pythonhosted.org/packages/f9/ae/bee3a227b4c623abd36c2354909354783a0a413e9bc11c5421c00b1ae1e9/unitexlemmatizer-1.0.0-py2.7.egg" }, { "comment_text": "", "digests": { "md5": "36a8f4d39f2d0b494158320ecb3faf6e", "sha256": "a493635169a21456d66e7587a065ec86e0fb80b926516198077335a60fd38df3" }, "downloads": -1, "filename": "unitexlemmatizer-1.0.0-py2.py3-none-any.whl", "has_sig": false, "md5_digest": "36a8f4d39f2d0b494158320ecb3faf6e", "packagetype": "bdist_wheel", "python_version": "py2.py3", "requires_python": null, "size": 4899, "upload_time": "2017-01-19T16:48:13", "url": "https://files.pythonhosted.org/packages/1e/d6/39ad1bd2dce9bd0d90faa64373a2fee48e89fe03e95da9b7a04cded0339b/unitexlemmatizer-1.0.0-py2.py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "e2b5ef3622bf8939bf6a9a39ce385bb4", "sha256": "6602ab1bdd8fd0946f6348718a6f6473814f81e8f77144e647dfee3645ff62a5" }, "downloads": -1, "filename": "unitexlemmatizer-1.0.0.tar.gz", "has_sig": false, "md5_digest": "e2b5ef3622bf8939bf6a9a39ce385bb4", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 2971, "upload_time": "2017-01-19T16:48:15", "url": "https://files.pythonhosted.org/packages/f5/7b/61b0192d541ccb055603d75bf52021b9399a5cf4a2ef22f0b09a34bbc208/unitexlemmatizer-1.0.0.tar.gz" } ] }, "urls": [ { "comment_text": "", "digests": { "md5": "4811bf793feb638b997305efa3654171", "sha256": "5a7a4699e10a1b37efaac2e9404e8766c0e664c907bc1a89fcd37910756dac08" }, "downloads": -1, "filename": "unitexlemmatizer-1.0.0-py2.7.egg", "has_sig": false, "md5_digest": "4811bf793feb638b997305efa3654171", "packagetype": "bdist_egg", "python_version": "2.7", "requires_python": null, "size": 5083, "upload_time": "2017-01-19T16:48:14", "url": "https://files.pythonhosted.org/packages/f9/ae/bee3a227b4c623abd36c2354909354783a0a413e9bc11c5421c00b1ae1e9/unitexlemmatizer-1.0.0-py2.7.egg" }, { "comment_text": "", "digests": { "md5": "36a8f4d39f2d0b494158320ecb3faf6e", "sha256": "a493635169a21456d66e7587a065ec86e0fb80b926516198077335a60fd38df3" }, "downloads": -1, "filename": "unitexlemmatizer-1.0.0-py2.py3-none-any.whl", "has_sig": false, "md5_digest": "36a8f4d39f2d0b494158320ecb3faf6e", "packagetype": "bdist_wheel", "python_version": "py2.py3", "requires_python": null, "size": 4899, "upload_time": "2017-01-19T16:48:13", "url": "https://files.pythonhosted.org/packages/1e/d6/39ad1bd2dce9bd0d90faa64373a2fee48e89fe03e95da9b7a04cded0339b/unitexlemmatizer-1.0.0-py2.py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "e2b5ef3622bf8939bf6a9a39ce385bb4", "sha256": "6602ab1bdd8fd0946f6348718a6f6473814f81e8f77144e647dfee3645ff62a5" }, "downloads": -1, "filename": "unitexlemmatizer-1.0.0.tar.gz", "has_sig": false, "md5_digest": "e2b5ef3622bf8939bf6a9a39ce385bb4", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 2971, "upload_time": "2017-01-19T16:48:15", "url": "https://files.pythonhosted.org/packages/f5/7b/61b0192d541ccb055603d75bf52021b9399a5cf4a2ef22f0b09a34bbc208/unitexlemmatizer-1.0.0.tar.gz" } ] }