{ "info": { "author": "Patricio Cerda", "author_email": "patricio.cerda@inria.fr", "bugtrack_url": null, "classifiers": [ "Development Status :: 2 - Pre-Alpha", "Environment :: Console", "Intended Audience :: Science/Research", "License :: OSI Approved :: BSD License", "Operating System :: OS Independent", "Programming Language :: Python :: 3.5", "Programming Language :: Python :: 3.6", "Topic :: Scientific/Engineering", "Topic :: Software Development :: Libraries" ], "description": "dirty_cat\n=========\n\ndirty_cat is a Python module for machine-learning on dirty categorical variables.\n\nWebsite: https://dirty-cat.github.io/\n\nFor a detailed description of the problem of encoding dirty categorical data,\nsee `Similarity encoding for learning with dirty categorical variables\n`_ [1]_.\n\nInstallation\n------------\n\nDependencies\n~~~~~~~~~~~~\n\ndirty_cat requires:\n\n- Python (>= 3.5)\n- NumPy (>= 1.8.2)\n- SciPy (>= 1.0.1)\n- scikit-learn (>= 0.20.0)\n\nOptional dependency:\n\n- python-Levenshtein for faster edit distances (not used for the n-gram\n distance)\n\nUser installation\n~~~~~~~~~~~~~~~~~\n\nIf you already have a working installation of NumPy and SciPy,\nthe easiest way to install dirty_cat is using ``pip`` ::\n\n pip install -U --user dirty_cat\n\nOther implementations\n~~~~~~~~~~~~~~~~~~~~~~\n\n- Spark ML: https://github.com/rakutentech/spark-dirty-cat\n\n\nReferences\n~~~~~~~~~~\n\n.. [1] Patricio Cerda, Ga\u00ebl Varoquaux, Bal\u00e1zs K\u00e9gl. Similarity encoding for learning with dirty categorical variables. 2018, Machine Learning journal, Springer.\n", "description_content_type": "", "docs_url": null, "download_url": "", "downloads": { "last_day": -1, "last_month": -1, "last_week": -1 }, "home_page": "http://dirty-cat.github.io/", "keywords": "", "license": "BSD", "maintainer": "", "maintainer_email": "", "name": "dirty_cat", "package_url": "https://pypi.org/project/dirty_cat/", "platform": "any", "project_url": "https://pypi.org/project/dirty_cat/", "project_urls": { "Homepage": "http://dirty-cat.github.io/" }, "release_url": "https://pypi.org/project/dirty_cat/0.0.5/", "requires_dist": null, "requires_python": "", "summary": "Machine learning with dirty categories.", "version": "0.0.5" }, "last_serial": 4504900, "releases": { "0.0.1": [ { "comment_text": "", "digests": { "md5": "061aa1cae603a4dd01ec2edcdea41bb4", "sha256": "48ff62d45cd605cb11964845a50707dd9c2d207c9aa8f42afd7e6f7f1000778a" }, "downloads": -1, "filename": "dirty_cat-0.0.1.tar.gz", "has_sig": false, "md5_digest": "061aa1cae603a4dd01ec2edcdea41bb4", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 8729, "upload_time": "2018-06-08T11:58:04", "url": "https://files.pythonhosted.org/packages/f1/ac/fbc68ed60656b2065866d1ee1e7b9e038d0980473522e9682fef40036834/dirty_cat-0.0.1.tar.gz" } ], "0.0.1a0": [ { "comment_text": "", "digests": { "md5": "18cb59dc209ec0e0d4b94328a74e9b1f", "sha256": "16f7c715168a2a76e8335f7d03216c44561b86e38121669ae2748d64bf8b5819" }, "downloads": -1, "filename": "dirty_cat-0.0.1a0.tar.gz", "has_sig": false, "md5_digest": "18cb59dc209ec0e0d4b94328a74e9b1f", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 414940, "upload_time": "2018-03-19T21:42:30", "url": "https://files.pythonhosted.org/packages/f4/e0/9dfd7cbe631baa147919baf53562520ad4b6aa6f1efd41f1784a8b496e83/dirty_cat-0.0.1a0.tar.gz" } ], "0.0.1b1": [ { "comment_text": "", "digests": { "md5": "441c78fbda93f02910b1c8c6e8c25a60", "sha256": "ce8ecf084e86efd87133610181ad5d079d16d1b9818b6a92b13b09c2cf6ba110" }, "downloads": -1, "filename": "dirty_cat-0.0.1b1.tar.gz", "has_sig": false, "md5_digest": "441c78fbda93f02910b1c8c6e8c25a60", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 415235, "upload_time": "2018-03-20T17:58:28", "url": "https://files.pythonhosted.org/packages/f1/b8/3832edee0bc0635f845232f32181a55a37d086e08356118bca1bf4577adb/dirty_cat-0.0.1b1.tar.gz" } ], "0.0.1b2": [ { "comment_text": "", "digests": { "md5": "8ab203a3e79d768132008fa248998c1b", "sha256": "e5055ffa83bcdf84d766d3672fb78e3d3fdebe9fcb4e05df438a96102cb97016" }, "downloads": -1, "filename": "dirty_cat-0.0.1b2.tar.gz", "has_sig": false, "md5_digest": "8ab203a3e79d768132008fa248998c1b", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 417186, "upload_time": "2018-03-27T09:19:46", "url": "https://files.pythonhosted.org/packages/0f/7c/4a363577547221175afb64340274dfe2805494da126e4836d4ec921f42ad/dirty_cat-0.0.1b2.tar.gz" } ], "0.0.1b3": [ { "comment_text": "", "digests": { "md5": "70ca4b232f863d0cb3a1a2ab6ff2de20", "sha256": "8c26eb84e31d5b430318ab59044634b3c5737c1b56073fd180fba9b9d8d7fbfe" }, "downloads": -1, "filename": "dirty_cat-0.0.1b3.tar.gz", "has_sig": false, "md5_digest": "70ca4b232f863d0cb3a1a2ab6ff2de20", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 417040, "upload_time": "2018-03-30T09:06:38", "url": "https://files.pythonhosted.org/packages/e5/2a/17bc08dc198be8ecbe968200e0cc86701b4765ad6b55ba8412d090997dd3/dirty_cat-0.0.1b3.tar.gz" } ], "0.0.2": [ { "comment_text": "", "digests": { "md5": "de3707a57a32e6af0cb02ccd2b0145db", "sha256": "afb84e6a04722373e8c5d5ea53948a67f164199baf9d0cadaf0187053708b896" }, "downloads": -1, "filename": "dirty_cat-0.0.2-py2.py3-none-any.whl", "has_sig": false, "md5_digest": "de3707a57a32e6af0cb02ccd2b0145db", "packagetype": "bdist_wheel", "python_version": "3.6", "requires_python": null, "size": 86959, "upload_time": "2018-11-06T06:37:07", "url": "https://files.pythonhosted.org/packages/a5/56/5cadefed4741a609df939f966aa0fd8b5e7c44a8b03e5a076b28c2fa243b/dirty_cat-0.0.2-py2.py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "e0e4a9a40a95a0a089cf224f8aecbf71", "sha256": "f7af2d5749ab6c5b0c1f2064abce806c67d4829a43bbbb7ea13c47e403c0e192" }, "downloads": -1, "filename": "dirty_cat-0.0.2.tar.gz", "has_sig": false, "md5_digest": "e0e4a9a40a95a0a089cf224f8aecbf71", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 75514, "upload_time": "2018-11-06T06:36:41", "url": "https://files.pythonhosted.org/packages/e0/e6/46418a29dbf80d17548190ef68589a6fe31973a42bcef27b1be9618bf3ed/dirty_cat-0.0.2.tar.gz" } ], "0.0.3": [ { "comment_text": "", "digests": { "md5": "270fd736b7e5c7da8a4ff25cffb3ead6", "sha256": "157e7aa4fb6dd63b644aa094099b29bc96461492bcb83d6474d8b8153943712a" }, "downloads": -1, "filename": "dirty_cat-0.0.3-py2.py3-none-any.whl", "has_sig": false, "md5_digest": "270fd736b7e5c7da8a4ff25cffb3ead6", "packagetype": "bdist_wheel", "python_version": "3.6", "requires_python": null, "size": 91231, "upload_time": "2018-11-19T21:59:31", "url": "https://files.pythonhosted.org/packages/69/d0/5de16e3c105d571fc464b71beb60d03651862fe4c7dbfe31761681c11b65/dirty_cat-0.0.3-py2.py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "8b1db8d709827524b380dfb82b1969cf", "sha256": "487f5e0c0a86a4afc267f38dad2a2d5046bcda91cb4e20e702962a907635637f" }, "downloads": -1, "filename": "dirty_cat-0.0.3.tar.gz", "has_sig": false, "md5_digest": "8b1db8d709827524b380dfb82b1969cf", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 79987, "upload_time": "2018-11-19T21:59:28", "url": "https://files.pythonhosted.org/packages/24/c1/60ef2763a69a62c11ab31809f9e04a600ebf274fae34b178c2767c2c0b0e/dirty_cat-0.0.3.tar.gz" } ], "0.0.4": [ { "comment_text": "", "digests": { "md5": "44fd99605c879a3fe6bde622cdbd1f26", "sha256": "45a257a16174bc7630868a6214355e3f84a291d979fca78bc469bb1101e11450" }, "downloads": -1, "filename": "dirty_cat-0.0.4-py2.py3-none-any.whl", "has_sig": false, "md5_digest": "44fd99605c879a3fe6bde622cdbd1f26", "packagetype": "bdist_wheel", "python_version": "2.7", "requires_python": null, "size": 91212, "upload_time": "2018-11-19T22:11:02", "url": "https://files.pythonhosted.org/packages/9c/91/eb6259f92a4dcce4a108e7307ed1cfc14d98c0ca53281c99297a7457fb32/dirty_cat-0.0.4-py2.py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "05e15bdb6bab3152a257dd127834f8fd", "sha256": "42ea3bcfbe3827b2868c598133a9fe174a1f12bec14db16f76c57b45497b3b51" }, "downloads": -1, "filename": "dirty_cat-0.0.4.tar.gz", "has_sig": false, "md5_digest": "05e15bdb6bab3152a257dd127834f8fd", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 79980, "upload_time": "2018-11-19T22:10:59", "url": "https://files.pythonhosted.org/packages/88/4a/86968c5f808ffb9d22139c8544b71f84d37fb6fea70270b409767222a32b/dirty_cat-0.0.4.tar.gz" } ], "0.0.5": [ { "comment_text": "", "digests": { "md5": "1f2d589cc345715fd69b82d91c4e631e", "sha256": "b1d78d173843364e8922f57fa39a1b7d813f083e894c87d4674e742ae8ef252e" }, "downloads": -1, "filename": "dirty_cat-0.0.5-py2.py3-none-any.whl", "has_sig": false, "md5_digest": "1f2d589cc345715fd69b82d91c4e631e", "packagetype": "bdist_wheel", "python_version": "3.6", "requires_python": null, "size": 91211, "upload_time": "2018-11-19T22:42:06", "url": "https://files.pythonhosted.org/packages/8d/84/7de88b45593b71fe8552c3038232502337eb3c0bd4b296361849a20fdabc/dirty_cat-0.0.5-py2.py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "2813fb0761d8b9ec4c970f6e2d85b394", "sha256": "30a7051e2485d4396a24c129660f292721b78c58e1942bfb42f721a5ac38930e" }, "downloads": -1, "filename": "dirty_cat-0.0.5.tar.gz", "has_sig": false, "md5_digest": "2813fb0761d8b9ec4c970f6e2d85b394", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 79982, "upload_time": "2018-11-19T22:42:03", "url": "https://files.pythonhosted.org/packages/c6/b4/6b32a7efa37aa6463f5b43629dfe3ffd59fdf2f49ba7f9bd352722deb06d/dirty_cat-0.0.5.tar.gz" } ] }, "urls": [ { "comment_text": "", "digests": { "md5": "1f2d589cc345715fd69b82d91c4e631e", "sha256": "b1d78d173843364e8922f57fa39a1b7d813f083e894c87d4674e742ae8ef252e" }, "downloads": -1, "filename": "dirty_cat-0.0.5-py2.py3-none-any.whl", "has_sig": false, "md5_digest": "1f2d589cc345715fd69b82d91c4e631e", "packagetype": "bdist_wheel", "python_version": "3.6", "requires_python": null, "size": 91211, "upload_time": "2018-11-19T22:42:06", "url": "https://files.pythonhosted.org/packages/8d/84/7de88b45593b71fe8552c3038232502337eb3c0bd4b296361849a20fdabc/dirty_cat-0.0.5-py2.py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "2813fb0761d8b9ec4c970f6e2d85b394", "sha256": "30a7051e2485d4396a24c129660f292721b78c58e1942bfb42f721a5ac38930e" }, "downloads": -1, "filename": "dirty_cat-0.0.5.tar.gz", "has_sig": false, "md5_digest": "2813fb0761d8b9ec4c970f6e2d85b394", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 79982, "upload_time": "2018-11-19T22:42:03", "url": "https://files.pythonhosted.org/packages/c6/b4/6b32a7efa37aa6463f5b43629dfe3ffd59fdf2f49ba7f9bd352722deb06d/dirty_cat-0.0.5.tar.gz" } ] }