{ "info": { "author": "Martijn van der Klis", "author_email": "m.h.vanderklis@uu.nl", "bugtrack_url": null, "classifiers": [ "License :: OSI Approved :: MIT License", "Operating System :: OS Independent", "Programming Language :: Python :: 2.7", "Topic :: Text Processing :: Linguistic" ], "description": "# treetagger-xml\n\nThis is a simple script (`process.py`) that reads in a .xml-file, uses TreeTagger to parse/lemmatize each sentence, and then outputs the input file with the tags and lemmata appended to the word elements.\n\n## Requirements\n\n### TreeTagger\n\nSee [the TreeTagger website](http://www.cis.uni-muenchen.de/~schmid/tools/TreeTagger/) for installation instructions. Note that you'll have to download a parameter file for each language you would want to tag/lemmatize. This script has been tested on version 3.2.1 of TreeTagger.\n\n### Python\n\nThis script runs in Python 2.7 and requires two external packages to run: [lxml](http://lxml.de/) and [treetaggerwrapper](http://treetaggerwrapper.readthedocs.io/en/latest/). The latter requires [six](https://pythonhosted.org/six/) to be installed as well. You can install these packages either locally (in a [virtualenv](http://virtualenv.readthedocs.io/en/latest/)) or globally via running:\n\n\tpip install -r requirements.txt\n\n## Running the script\n\nBefore running the script, it's best to set an environment variable with the location of TreeTagger. The treetaggerwrapper tries to detect the installation automatically, but this is not fool-proof. You can set the environment variable (under Linux) with:\n\n\texport TAGDIR=/opt/treetagger/\n\nAlternatively, you can modify `process.py` and hard-code your installation path in the TreeTagger instantiation.\n\nThen, you can run the `process.py` script. It requires two parameters: your language of choice for parsing and lemmatizing, and your input file(s). In the `examples/` directory you can find some example .xml-files. 
Run\n\n\tpython process.py en examples/en.xml\n\nto process the English example. The resulting file will be named `examples/en-out.xml`.\n\n\n", "description_content_type": "text/markdown", "docs_url": null, "download_url": "", "downloads": { "last_day": -1, "last_month": -1, "last_week": -1 }, "home_page": "https://github.com/time-in-translation/treetagger-xml", "keywords": "", "license": "MIT", "maintainer": "", "maintainer_email": "", "name": "treetagger-xml", "package_url": "https://pypi.org/project/treetagger-xml/", "platform": "", "project_url": "https://pypi.org/project/treetagger-xml/", "project_urls": { "Homepage": "https://github.com/time-in-translation/treetagger-xml" }, "release_url": "https://pypi.org/project/treetagger-xml/0.1.3/", "requires_dist": [ "lxml", "six", "treetaggerwrapper" ], "requires_python": "", "summary": "Reads .xml-files and parses these with TreeTagger", "version": "0.1.3" }, "last_serial": 4247521, "releases": { "0.1": [ { "comment_text": "", "digests": { "md5": "fbbbe82560ffff9cc553985a99e31675", "sha256": "a4b819c165f6e2376d1805e8eb25da9a3e9e2d2784fb132d1c9c010830a76961" }, "downloads": -1, "filename": "treetagger_xml-0.1-py2-none-any.whl", "has_sig": false, "md5_digest": "fbbbe82560ffff9cc553985a99e31675", "packagetype": "bdist_wheel", "python_version": "py2", "requires_python": null, "size": 4452, "upload_time": "2018-09-05T11:46:40", "url": "https://files.pythonhosted.org/packages/f7/56/ba2bdf0dde5a58d88ae798179afc68328bab79549c9a73f4c76bc15c9eeb/treetagger_xml-0.1-py2-none-any.whl" }, { "comment_text": "", "digests": { "md5": "31721730913a042dbb457b2ab29050c7", "sha256": "87055506c61aa6dd21ec50e52a2f0304e162f2d178d507f315612919652a8026" }, "downloads": -1, "filename": "treetagger-xml-0.1.tar.gz", "has_sig": false, "md5_digest": "31721730913a042dbb457b2ab29050c7", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 3993, "upload_time": "2018-09-05T11:46:42", "url": 
"https://files.pythonhosted.org/packages/4e/1a/c5e3ab63a9ffa054f729c49bef1c3f73ecce919a7f923db5de2bd14f5ffb/treetagger-xml-0.1.tar.gz" } ], "0.1.1": [ { "comment_text": "", "digests": { "md5": "a612c4b74b2b3c9f7192eef9cac09cba", "sha256": "522866566ead9996d6c62a8e34814dd2dfdeb0bdcae8dab12124285490625772" }, "downloads": -1, "filename": "treetagger_xml-0.1.1-py2-none-any.whl", "has_sig": false, "md5_digest": "a612c4b74b2b3c9f7192eef9cac09cba", "packagetype": "bdist_wheel", "python_version": "py2", "requires_python": null, "size": 4510, "upload_time": "2018-09-05T12:21:30", "url": "https://files.pythonhosted.org/packages/9d/a5/32f67cc164d88e1a3ebc3cb367756468c78dd26dff39958e4f5076555faf/treetagger_xml-0.1.1-py2-none-any.whl" }, { "comment_text": "", "digests": { "md5": "bb5cf676855d9c4cc12bbeab9835f46e", "sha256": "f82ff624f58ef347202a7c862f34ad19acd55928ed154a5f9db2609e27ae56ce" }, "downloads": -1, "filename": "treetagger-xml-0.1.1.tar.gz", "has_sig": false, "md5_digest": "bb5cf676855d9c4cc12bbeab9835f46e", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 4095, "upload_time": "2018-09-05T12:21:33", "url": "https://files.pythonhosted.org/packages/f7/eb/88023e57c13737d68535b78728c3b21609ffefa7876a1af5abf7fbbc7439/treetagger-xml-0.1.1.tar.gz" } ], "0.1.2": [ { "comment_text": "", "digests": { "md5": "3682c7bfaaddb692c47efc20dd34c217", "sha256": "6ee7648ff55c1253bcdc466f40ef9e8305f3eb2d002bae58bc4b61d48f4259ec" }, "downloads": -1, "filename": "treetagger_xml-0.1.2-py2-none-any.whl", "has_sig": false, "md5_digest": "3682c7bfaaddb692c47efc20dd34c217", "packagetype": "bdist_wheel", "python_version": "py2", "requires_python": null, "size": 7106, "upload_time": "2018-09-06T10:09:04", "url": "https://files.pythonhosted.org/packages/2c/13/bb82e517267df58ee01fb352b6c358cd5e97b4cb97bb8aae5dec9b267ced/treetagger_xml-0.1.2-py2-none-any.whl" }, { "comment_text": "", "digests": { "md5": "5df062d2ba33cbc3b08ec7b3fdeaa9c6", "sha256": 
"37f4cfd60023545c24cec229dc89cbb968f90691952ff67ed963ef338033bab1" }, "downloads": -1, "filename": "treetagger-xml-0.1.2.tar.gz", "has_sig": false, "md5_digest": "5df062d2ba33cbc3b08ec7b3fdeaa9c6", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 4050, "upload_time": "2018-09-06T10:09:05", "url": "https://files.pythonhosted.org/packages/09/60/3ab2b83153d0fc45329ffe9b6f2b36c956239b584fd5a7a445001901e3ec/treetagger-xml-0.1.2.tar.gz" } ], "0.1.3": [ { "comment_text": "", "digests": { "md5": "6c4c2b09d75f9140f93e76ec06d366e0", "sha256": "b34b16a2629e2c2a59f5cc90014ef9e05079081d5e04186e1d2a288e6accc8e9" }, "downloads": -1, "filename": "treetagger_xml-0.1.3-py2-none-any.whl", "has_sig": false, "md5_digest": "6c4c2b09d75f9140f93e76ec06d366e0", "packagetype": "bdist_wheel", "python_version": "py2", "requires_python": null, "size": 5502, "upload_time": "2018-09-07T08:08:35", "url": "https://files.pythonhosted.org/packages/f3/b3/b6033d6ac36396d04ff8d2d7fd7d7c5c4e137d8f55d87bf2e9aeb2481795/treetagger_xml-0.1.3-py2-none-any.whl" }, { "comment_text": "", "digests": { "md5": "70a6209dff280c37cc7ea38dde74c791", "sha256": "3fd60de88ecc04de01855fc0987ab7bd7128f912fad2fa4e8d66a3af8ad6f5d4" }, "downloads": -1, "filename": "treetagger-xml-0.1.3.tar.gz", "has_sig": false, "md5_digest": "70a6209dff280c37cc7ea38dde74c791", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 4266, "upload_time": "2018-09-07T08:08:36", "url": "https://files.pythonhosted.org/packages/f6/2d/786c3fa1bb66f91836882a40b5ae1a83c02dc3663efdb9d11f70f926e823/treetagger-xml-0.1.3.tar.gz" } ] }, "urls": [ { "comment_text": "", "digests": { "md5": "6c4c2b09d75f9140f93e76ec06d366e0", "sha256": "b34b16a2629e2c2a59f5cc90014ef9e05079081d5e04186e1d2a288e6accc8e9" }, "downloads": -1, "filename": "treetagger_xml-0.1.3-py2-none-any.whl", "has_sig": false, "md5_digest": "6c4c2b09d75f9140f93e76ec06d366e0", "packagetype": "bdist_wheel", "python_version": "py2", 
"requires_python": null, "size": 5502, "upload_time": "2018-09-07T08:08:35", "url": "https://files.pythonhosted.org/packages/f3/b3/b6033d6ac36396d04ff8d2d7fd7d7c5c4e137d8f55d87bf2e9aeb2481795/treetagger_xml-0.1.3-py2-none-any.whl" }, { "comment_text": "", "digests": { "md5": "70a6209dff280c37cc7ea38dde74c791", "sha256": "3fd60de88ecc04de01855fc0987ab7bd7128f912fad2fa4e8d66a3af8ad6f5d4" }, "downloads": -1, "filename": "treetagger-xml-0.1.3.tar.gz", "has_sig": false, "md5_digest": "70a6209dff280c37cc7ea38dde74c791", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 4266, "upload_time": "2018-09-07T08:08:36", "url": "https://files.pythonhosted.org/packages/f6/2d/786c3fa1bb66f91836882a40b5ae1a83c02dc3663efdb9d11f70f926e823/treetagger-xml-0.1.3.tar.gz" } ] }