{ "info": { "author": "Aaron Halfaker", "author_email": "aaron.halfaker@gmail.com", "bugtrack_url": null, "classifiers": [ "Environment :: Other Environment", "Intended Audience :: Developers", "License :: OSI Approved :: MIT License", "Operating System :: OS Independent", "Programming Language :: Python", "Programming Language :: Python :: 3", "Programming Language :: Python :: 3 :: Only", "Topic :: Scientific/Engineering", "Topic :: Software Development :: Libraries :: Python Modules", "Topic :: Text Processing :: General", "Topic :: Text Processing :: Linguistic", "Topic :: Utilities" ], "description": "# MediaWiki XML\n\nThis library contains a collection of utilities for efficiently \nprocessing MediaWiki\u2019s XML database dumps. There are two \nimportant concerns that this module intends to address: \ncomplexity and performance of streaming XML parsing. This library\nenables memory efficent stream processing of XML dumps with \na simple [`iterator`](https://pythonhosted.org/mwxml/iteration.html) \nstrategy. This library also implements a distributed\nprocessing strategy (see \n[`map()`](https://pythonhosted.org/mwxml/map.html)) that enables parallel\nprocessing of many XML dump files at the same time. \n\n* **Installation:** ``pip install mwxml``\n* **Documentation:** https://pythonhosted.org/mwxml\n* **Repositiory:** https://github.com/mediawiki-utilities/python-mwxml\n* **License:** MIT\n\n## Example\n\n >>> import mwxml\n >>>\n >>> dump = mwxml.Dump.from_file(open(\"dump.xml\"))\n >>> print(dump.site_info.name, dump.site_info.dbname)\n Wikipedia enwiki\n >>>\n >>> for page in dump:\n ... for revision in page:\n ... print(revision.id)\n ...\n 1\n 2\n 3\n \n## Author\n* Aaron Halfaker -- https://github.com/halfak\n\n## See also \n* http://dumps.wikimedia.org/\n* http://community.wikia.com/wiki/Help:Database_download", "description_content_type": null, "docs_url": "https://pythonhosted.org/mwxml/", "download_url": "UNKNOWN", "downloads": { "last_day": -1, "last_month": -1, "last_week": -1 }, "home_page": "https://github.com/mediawiki-utilities/python-mwxml", "keywords": null, "license": "MIT", "maintainer": null, "maintainer_email": null, "name": "mwxml", "package_url": "https://pypi.org/project/mwxml/", "platform": "UNKNOWN", "project_url": "https://pypi.org/project/mwxml/", "project_urls": { "Download": "UNKNOWN", "Homepage": "https://github.com/mediawiki-utilities/python-mwxml" }, "release_url": "https://pypi.org/project/mwxml/0.3.3/", "requires_dist": null, "requires_python": null, "summary": "A set of utilities for processing MediaWiki XML dump data.", "version": "0.3.3" }, "last_serial": 2994958, "releases": { "0.0.1": [ { "comment_text": "", "digests": { "md5": "b5c742ce6d679ba07f01e224639915d1", "sha256": "11a71a095a0c7be8ed75f78c83ff59a2321a9bd7278d11855619e8f6e21f0bd4" }, "downloads": -1, "filename": "mwxml-0.0.1.tar.gz", "has_sig": false, "md5_digest": "b5c742ce6d679ba07f01e224639915d1", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 12169, "upload_time": "2015-08-24T21:13:38", "url": "https://files.pythonhosted.org/packages/a9/15/918042ee81178d76d6ba137786ac9f1506c5a6b48657fa7bfbec40909896/mwxml-0.0.1.tar.gz" }, { "comment_text": "", "digests": { "md5": "fc1e1c7bd8baba2762ede54f106c8ba4", "sha256": "c78e8833699a28b5f5e6d400920439025576bde586fddb962adf5e0021cc4ae2" }, "downloads": -1, "filename": "mwxml-0.0.1.zip", "has_sig": false, "md5_digest": "fc1e1c7bd8baba2762ede54f106c8ba4", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 22004, "upload_time": "2015-08-24T21:13:47", "url": "https://files.pythonhosted.org/packages/32/7b/1ec66888f6e730ff74300a159f475e2681fce6a1fca2344169b67815da3b/mwxml-0.0.1.zip" } ], "0.0.2": [ { "comment_text": "", "digests": { "md5": "95c9e73327ad5289cfe6e399610c0cef", "sha256": "dbdafcfaf398637c1dc45a16eaa81886a0bea52f471aee6592d6c89d291a7142" }, "downloads": -1, "filename": "mwxml-0.0.2.tar.gz", "has_sig": false, "md5_digest": "95c9e73327ad5289cfe6e399610c0cef", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 12249, "upload_time": "2015-08-24T21:20:57", "url": "https://files.pythonhosted.org/packages/17/42/3ebefcb98476462b7c3c64fbc401b027900ddee0c0db4d6ca937e6c53a8d/mwxml-0.0.2.tar.gz" }, { "comment_text": "", "digests": { "md5": "55016c180d7c6fd0061e67cacfd624ce", "sha256": "33d4a82833097ce2c7fbad3a74a362857856119ad51c1aea10695637d4461a9e" }, "downloads": -1, "filename": "mwxml-0.0.2.zip", "has_sig": false, "md5_digest": "55016c180d7c6fd0061e67cacfd624ce", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 22203, "upload_time": "2015-08-24T21:21:17", "url": "https://files.pythonhosted.org/packages/15/91/aa16bda45c5fc8a2931c781c4b82c47bd6aa99e13e3d3d91138b4ec62927/mwxml-0.0.2.zip" } ], "0.0.3": [ { "comment_text": "", "digests": { "md5": "dd708bdf26224f2344148081aa381c95", "sha256": "006fae1ae641656213d2b16514d4336b10170946a3fc075734267bf23d19e6f2" }, "downloads": -1, "filename": "mwxml-0.0.3.tar.gz", "has_sig": false, "md5_digest": "dd708bdf26224f2344148081aa381c95", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 12353, "upload_time": "2015-08-24T22:34:40", "url": "https://files.pythonhosted.org/packages/c6/df/bb0147980b24197f79c7fe1662d2113f18e1a41bd121bae1ef10ec84c5c1/mwxml-0.0.3.tar.gz" }, { "comment_text": "", "digests": { "md5": "a4395b55be9f910832cc1fef8e81b512", "sha256": "bc36f06d30c4625ca5d00abe88663360dcb3438eedc73dbfae6eab6f210115a3" }, "downloads": -1, "filename": "mwxml-0.0.3.zip", "has_sig": false, "md5_digest": "a4395b55be9f910832cc1fef8e81b512", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 22482, "upload_time": "2015-08-24T22:34:46", "url": "https://files.pythonhosted.org/packages/56/f0/02ce4988799f338958d3c66302ad4a4ab923c92425a93efd9282aeef6ef5/mwxml-0.0.3.zip" } ], "0.0.4": [ { "comment_text": "", "digests": { "md5": "bbc7758f74a66acbd4dbbea041c3c6b6", "sha256": "41b61105bc8fa6c44e1e0c88c097da27a63eaa8cdf2216802085056ddf4732db" }, "downloads": -1, "filename": "mwxml-0.0.4.tar.gz", "has_sig": false, "md5_digest": "bbc7758f74a66acbd4dbbea041c3c6b6", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 12343, "upload_time": "2015-08-25T19:20:43", "url": "https://files.pythonhosted.org/packages/d9/1a/4d52ee7faa6d7c0cd9839e64c8acaf5d4a489ec11d60abd6b8baeb30ab51/mwxml-0.0.4.tar.gz" }, { "comment_text": "", "digests": { "md5": "a395ff3da4db63fb37051364f7b63c5d", "sha256": "50426c5c6f8de748401cad7058b4db2d4388a4999de2187682eac4636035dc75" }, "downloads": -1, "filename": "mwxml-0.0.4.zip", "has_sig": false, "md5_digest": "a395ff3da4db63fb37051364f7b63c5d", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 23616, "upload_time": "2015-08-25T19:20:48", "url": "https://files.pythonhosted.org/packages/55/c9/4859c2a7d9b59ace3792b878a6f8f7f322e0fb2221d4868da6b9a27c5ea1/mwxml-0.0.4.zip" } ], "0.1.0": [ { "comment_text": "", "digests": { "md5": "9dc308b5b76480bb22bb25e101767f7f", "sha256": "ac6c3b6edf3a337ef874ad9a73fb90fe087ed4b90a622472bc82e1b95e07fbc6" }, "downloads": -1, "filename": "mwxml-0.1.0.tar.gz", "has_sig": false, "md5_digest": "9dc308b5b76480bb22bb25e101767f7f", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 13465, "upload_time": "2015-08-27T16:09:53", "url": "https://files.pythonhosted.org/packages/32/d4/fccecedd219fb013ef4a7babd51444645d3de547baf44d260e7dde39fa1e/mwxml-0.1.0.tar.gz" }, { "comment_text": "", "digests": { "md5": "0af1c90763f924cb1ef38f748e44d1fa", "sha256": "0d583b3a79a9692fcf2782ab684704dc51e91a6b6384a964ff2d23ee74c46639" }, "downloads": -1, "filename": "mwxml-0.1.0.zip", "has_sig": false, "md5_digest": "0af1c90763f924cb1ef38f748e44d1fa", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 23745, "upload_time": "2015-08-27T16:09:56", "url": "https://files.pythonhosted.org/packages/4e/89/5115b3b11547c3ee3d2830f78b39b03272b0e450c1e606b70840e3a73f6b/mwxml-0.1.0.zip" } ], "0.1.1": [ { "comment_text": "", "digests": { "md5": "88dae301843636eb6a96bd3c7ef1cd0e", "sha256": "3e80068b08f081bf72fef2b34e3b28c3de00ca1c21f0ae7ce536a7bd726de7c0" }, "downloads": -1, "filename": "mwxml-0.1.1.tar.gz", "has_sig": false, "md5_digest": "88dae301843636eb6a96bd3c7ef1cd0e", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 12696, "upload_time": "2015-09-09T16:46:49", "url": "https://files.pythonhosted.org/packages/89/03/b1133ea1fd0dfe2d9d0866abefd0c002e878090a0325c800bb14162a823e/mwxml-0.1.1.tar.gz" }, { "comment_text": "", "digests": { "md5": "5fa3e7f6fa11ddca9b31a26f43ea7996", "sha256": "6de9db8bcfb40edfad1120c706b24223403cd8bf860019f874feb565efdfac3d" }, "downloads": -1, "filename": "mwxml-0.1.1.zip", "has_sig": false, "md5_digest": "5fa3e7f6fa11ddca9b31a26f43ea7996", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 22864, "upload_time": "2015-09-09T16:46:52", "url": "https://files.pythonhosted.org/packages/5a/03/c49eaca263b79e7f378e47fc455beeb25cf887ff24a345e2f7bb78e2c1e4/mwxml-0.1.1.zip" } ], "0.2.0": [ { "comment_text": "", "digests": { "md5": "d0da58d980e539255266106e10f529b1", "sha256": "1ac0860920d57880b58b8677a175429b1753b86a04a51469c84e2511824fab5c" }, "downloads": -1, "filename": "mwxml-0.2.0.tar.gz", "has_sig": false, "md5_digest": "d0da58d980e539255266106e10f529b1", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 12852, "upload_time": "2015-09-24T19:55:00", "url": "https://files.pythonhosted.org/packages/e3/80/9d673aee22c3e3a34955f377dbbe365248a32acddeeab475e9d2eb630254/mwxml-0.2.0.tar.gz" }, { "comment_text": "", "digests": { "md5": "c5d7392ddd7d8b3dd4f55fc4111c564b", "sha256": "da0f9b0197947cfc3b827831f28eb67b906d1114fe88937ec3f23f0b5469ba0f" }, "downloads": -1, "filename": "mwxml-0.2.0.zip", "has_sig": false, "md5_digest": "c5d7392ddd7d8b3dd4f55fc4111c564b", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 23665, "upload_time": "2015-09-24T19:55:11", "url": "https://files.pythonhosted.org/packages/03/70/2597e7a25f0a914cc6ed4a5ebda6a6e3354289767e954759dbd1f745872f/mwxml-0.2.0.zip" } ], "0.2.1": [ { "comment_text": "", "digests": { "md5": "6fc035e7a9e25342e57aa648f4a559d8", "sha256": "ad49b9251fd8d5fd5ad30dfff571fb8e4d8015426bb831336be551961417b0e6" }, "downloads": -1, "filename": "mwxml-0.2.1-py2.py3-none-any.whl", "has_sig": false, "md5_digest": "6fc035e7a9e25342e57aa648f4a559d8", "packagetype": "bdist_wheel", "python_version": "3.4", "requires_python": null, "size": 29115, "upload_time": "2015-10-10T16:44:56", "url": "https://files.pythonhosted.org/packages/43/b3/75c580fd467243347f1b7ad4ce5435d74a2b1ffd124f57c9ca8998a655d0/mwxml-0.2.1-py2.py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "c1043c56d0cc60ddb2b5cdc1d644d824", "sha256": "29dd86a8783532afb72523c7a9445be08c4814e6ffa64a00db966e2e548da6b6" }, "downloads": -1, "filename": "mwxml-0.2.1.tar.gz", "has_sig": false, "md5_digest": "c1043c56d0cc60ddb2b5cdc1d644d824", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 13620, "upload_time": "2015-10-10T16:44:52", "url": "https://files.pythonhosted.org/packages/9a/6f/e3cdea7a15b2c0a085c1a730210cfb22ef4d39dcf067e51450ef5119ba85/mwxml-0.2.1.tar.gz" } ], "0.2.2": [ { "comment_text": "", "digests": { "md5": "cedb7d210b883afbe21fb6b81f5e5bce", "sha256": "5a92ed56eceb5a282d68fade4451583bbd0eda411b831003f6e7b087471cb5d5" }, "downloads": -1, "filename": "mwxml-0.2.2.tar.gz", "has_sig": false, "md5_digest": "cedb7d210b883afbe21fb6b81f5e5bce", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 13901, "upload_time": "2016-05-03T20:05:37", "url": "https://files.pythonhosted.org/packages/e6/71/2f2c1c72f9293b663e17bba6d714cc78dbb1972a2106857eca20048a716a/mwxml-0.2.2.tar.gz" } ], "0.3.0": [ { "comment_text": "", "digests": { "md5": "4c2ae1e75cb4b0683be75e700bb9e35a", "sha256": "8c2f0027e4d30e3a415b0b8eff8e88ecb8d828738a8820a7420214ab61f545f5" }, "downloads": -1, "filename": "mwxml-0.3.0-py2.py3-none-any.whl", "has_sig": false, "md5_digest": "4c2ae1e75cb4b0683be75e700bb9e35a", "packagetype": "bdist_wheel", "python_version": "3.5", "requires_python": null, "size": 32328, "upload_time": "2017-05-03T15:47:15", "url": "https://files.pythonhosted.org/packages/f4/2d/067ca56ed7750a26649d7930b847d81e7fdbc111ece01d74cf1e28e1067d/mwxml-0.3.0-py2.py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "a1c54983707fe0173c70cbfd3ea9ba07", "sha256": "bf1978536784ae3f5cc373eefff918c3f60190ddca2f672e962774eb4076bfac" }, "downloads": -1, "filename": "mwxml-0.3.0.tar.gz", "has_sig": false, "md5_digest": "a1c54983707fe0173c70cbfd3ea9ba07", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 15997, "upload_time": "2017-05-03T15:47:12", "url": "https://files.pythonhosted.org/packages/e7/a0/ca47e8e2c80563efeb9e1792a12f4c319cae72dd0e9e7e6b20a3f736f362/mwxml-0.3.0.tar.gz" } ], "0.3.1": [ { "comment_text": "", "digests": { "md5": "9e482a2b7503bdffbad554db51e2b1b1", "sha256": "84d032d99ae6f7767a83d2fb5901617a04648f8ad6380a5823c6b7de21c2e8be" }, "downloads": -1, "filename": "mwxml-0.3.1-py2.py3-none-any.whl", "has_sig": false, "md5_digest": "9e482a2b7503bdffbad554db51e2b1b1", "packagetype": "bdist_wheel", "python_version": "3.5", "requires_python": null, "size": 32388, "upload_time": "2017-05-04T14:48:57", "url": "https://files.pythonhosted.org/packages/00/6a/de5b0c4a7f765edb4567abd84dd751ed06a0e5fe2f0f9da5945318cf6df6/mwxml-0.3.1-py2.py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "48c94b2327295fcc2bb8b22f9714b6de", "sha256": "92763185cc2a10cb5edbcc9e938930f317e9ec1f81e7da0b20eeb294d3fd1ed6" }, "downloads": -1, "filename": "mwxml-0.3.1.tar.gz", "has_sig": false, "md5_digest": "48c94b2327295fcc2bb8b22f9714b6de", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 16054, "upload_time": "2017-05-04T14:48:56", "url": "https://files.pythonhosted.org/packages/1b/b3/3fecd3b3b4667acf13ff9f18f99a4106683c881043430337da632f12c1b5/mwxml-0.3.1.tar.gz" } ], "0.3.2": [ { "comment_text": "", "digests": { "md5": "71e2084b81ce2f2d006074099c8a677c", "sha256": "c3994bbae73ba3504474336697a3d825f7b882d12afed529cdf2789bce8fd6d6" }, "downloads": -1, "filename": "mwxml-0.3.2-py2.py3-none-any.whl", "has_sig": false, "md5_digest": "71e2084b81ce2f2d006074099c8a677c", "packagetype": "bdist_wheel", "python_version": "3.5", "requires_python": null, "size": 32579, "upload_time": "2017-07-01T19:10:35", "url": "https://files.pythonhosted.org/packages/9d/eb/c469cb2d3f3cebf97ea4429b5baf1aba5d8c0ada84f017cc83197b6c7684/mwxml-0.3.2-py2.py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "3d61e567173c2d518f7613cd803cb348", "sha256": "c8b992db787c84efc4e1342dbe102a4d4f245c318e9afdacf1e27b4db80b20f9" }, "downloads": -1, "filename": "mwxml-0.3.2.tar.gz", "has_sig": false, "md5_digest": "3d61e567173c2d518f7613cd803cb348", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 16257, "upload_time": "2017-07-01T19:10:33", "url": "https://files.pythonhosted.org/packages/af/92/bc8f93824a1b6106e2b41f14ef934b3f4995f5b3bcc99abc90ea61fb34ec/mwxml-0.3.2.tar.gz" } ], "0.3.3": [ { "comment_text": "", "digests": { "md5": "aada108026d95ee371430c7ac8367477", "sha256": "9695848b8b6987b6f6addc2a8accba5b2bcbc543702598194e182b508ab568a9" }, "downloads": -1, "filename": "mwxml-0.3.3-py2.py3-none-any.whl", "has_sig": false, "md5_digest": "aada108026d95ee371430c7ac8367477", "packagetype": "bdist_wheel", "python_version": "3.5", "requires_python": null, "size": 32580, "upload_time": "2017-07-02T16:22:46", "url": "https://files.pythonhosted.org/packages/28/af/1277846ecfdc19d8ba9fd75cf5a180955f21709d52c98f8c20bec525de84/mwxml-0.3.3-py2.py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "092fbe06f705e55bf2b1ed0b8ee2c0cd", "sha256": "0848df0cf2e293718f554311acf4715bd679f639f4e52cbe47d8206589db1d31" }, "downloads": -1, "filename": "mwxml-0.3.3.tar.gz", "has_sig": false, "md5_digest": "092fbe06f705e55bf2b1ed0b8ee2c0cd", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 16274, "upload_time": "2017-07-02T16:22:43", "url": "https://files.pythonhosted.org/packages/ab/47/4e9fc0684370048b6673783409b410a840c62e4fd34164ba177fe0d373c9/mwxml-0.3.3.tar.gz" } ] }, "urls": [ { "comment_text": "", "digests": { "md5": "aada108026d95ee371430c7ac8367477", "sha256": "9695848b8b6987b6f6addc2a8accba5b2bcbc543702598194e182b508ab568a9" }, "downloads": -1, "filename": "mwxml-0.3.3-py2.py3-none-any.whl", "has_sig": false, "md5_digest": "aada108026d95ee371430c7ac8367477", "packagetype": "bdist_wheel", "python_version": "3.5", "requires_python": null, "size": 32580, "upload_time": "2017-07-02T16:22:46", "url": "https://files.pythonhosted.org/packages/28/af/1277846ecfdc19d8ba9fd75cf5a180955f21709d52c98f8c20bec525de84/mwxml-0.3.3-py2.py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "092fbe06f705e55bf2b1ed0b8ee2c0cd", "sha256": "0848df0cf2e293718f554311acf4715bd679f639f4e52cbe47d8206589db1d31" }, "downloads": -1, "filename": "mwxml-0.3.3.tar.gz", "has_sig": false, "md5_digest": "092fbe06f705e55bf2b1ed0b8ee2c0cd", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 16274, "upload_time": "2017-07-02T16:22:43", "url": "https://files.pythonhosted.org/packages/ab/47/4e9fc0684370048b6673783409b410a840c62e4fd34164ba177fe0d373c9/mwxml-0.3.3.tar.gz" } ] }