{ "info": { "author": "Michele Lacchia", "author_email": "michelelacchia@gmail.com", "bugtrack_url": null, "classifiers": [ "Development Status :: 3 - Alpha", "Programming Language :: Python", "Programming Language :: Python :: 2", "Programming Language :: Python :: 2.6", "Programming Language :: Python :: 2.7", "Programming Language :: Python :: 3", "Programming Language :: Python :: 3.1", "Programming Language :: Python :: 3.2", "Programming Language :: Python :: 3.3", "Programming Language :: Python :: 3.4", "Programming Language :: Python :: 3.5" ], "description": "sklearn-pdtransform\n-------------------\n\nInstallation:\n\n.. code::\n\n $ pip install pdtransform\n\nA little package with a few transformers to work with Pandas dataframes in the\nSklearn pipeline, which I found myself writing quite frequently. Example usage:\n\n.. code:: python\n\n from pdtransform import DFTransform, DFFeatureUnion\n\n pipeline = Pipeline([\n ('ordinal_to_nums', DFTransform(_ordinal_to_nums, copy=True)),\n ('union', DFFeatureUnion([\n ('categorical', Pipeline([\n ('select', DFTransform(lambda X: X.select_dtypes(include=['object']))),\n ('fill_na', DFTransform(lambda X: X.fillna('NA'))),\n ('one_hot', DFTransform(_one_hot_encode)),\n ])),\n ('numerical', Pipeline([\n ('select', DFTransform(lambda X: X.select_dtypes(exclude=['object']))),\n ('fill_median', DFTransform(lambda X: X.fillna(X.median()))),\n ('add_features', DFTransform(_add_features, copy=True)),\n ('remove_skew', DFTransform(_remove_skew, copy=True)),\n ('find_outliers', DFTransform(_find_outliers, copy=True)),\n ('normalize', DFTransform(lambda X: X.div(X.max())))\n ])),\n ])),\n ])\n\n\nFor more information read `this blog post `_.\n", "description_content_type": null, "docs_url": null, "download_url": "", "downloads": { "last_day": -1, "last_month": -1, "last_week": -1 }, "home_page": "http://signal-to-noise.xyz/why-you-should-use-scikit-learns-pipeline-object.html", "keywords": "sklearn pandas transformers pipeline", "license": "MIT", "maintainer": "", "maintainer_email": "", "name": "pdtransform", "package_url": "https://pypi.org/project/pdtransform/", "platform": "any", "project_url": "https://pypi.org/project/pdtransform/", "project_urls": { "Homepage": "http://signal-to-noise.xyz/why-you-should-use-scikit-learns-pipeline-object.html" }, "release_url": "https://pypi.org/project/pdtransform/0.2/", "requires_dist": null, "requires_python": "", "summary": "Sklearn transformers that work with Pandas dataframes", "version": "0.2" }, "last_serial": 3286385, "releases": { "0.1": [ { "comment_text": "", "digests": { "md5": "aee6860fae7cd3b050627ae08b3a9b7a", "sha256": "05203e7b552fc5782ab7e8ed8abb6b22d39a14292947417e5702ae35f376cfa1" }, "downloads": -1, "filename": "pdtransform-0.1-py2.py3-none-any.whl", "has_sig": false, "md5_digest": "aee6860fae7cd3b050627ae08b3a9b7a", "packagetype": "bdist_wheel", "python_version": "3.5", "requires_python": null, "size": 3627, "upload_time": "2016-11-28T13:41:30", "url": "https://files.pythonhosted.org/packages/34/d8/2acd8d05c456037af125d02d4b6b3fab0c0188aeb9f2b1f90612c32b2f22/pdtransform-0.1-py2.py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "fc70d25618866deb7430f8627a66c39d", "sha256": "e7e765fa72a37b3eab22d322de75ecf3e7293401b4a7b944124ad65741350df1" }, "downloads": -1, "filename": "pdtransform-0.1.tar.gz", "has_sig": false, "md5_digest": "fc70d25618866deb7430f8627a66c39d", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 2098, "upload_time": "2016-11-28T13:41:28", "url": "https://files.pythonhosted.org/packages/f5/f2/39cc8de1033b841b7e33c18d7d21f91c02669c006d6c58911f9aaac54426/pdtransform-0.1.tar.gz" } ], "0.2": [ { "comment_text": "", "digests": { "md5": "55b032f24af3eb172a8ab2bcc23093b0", "sha256": "88359e9649cc7d530b209731b97c3120d2d303f3f122e1593e94bdbe5468dfdc" }, "downloads": -1, "filename": "pdtransform-0.2-py2.py3-none-any.whl", "has_sig": false, "md5_digest": "55b032f24af3eb172a8ab2bcc23093b0", "packagetype": "bdist_wheel", "python_version": "3.6", "requires_python": null, "size": 3813, "upload_time": "2017-10-28T14:48:07", "url": "https://files.pythonhosted.org/packages/76/37/87df6568d24234b9d258d7a93bd549b01ef7572987dfa50a44c1c7466575/pdtransform-0.2-py2.py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "6a3e19899bf5ce22544a30dcbd322ac6", "sha256": "1ae101f7bfdaead85269b1dec5fd796f054bec491910a6d0430504645c44c628" }, "downloads": -1, "filename": "pdtransform-0.2.tar.gz", "has_sig": false, "md5_digest": "6a3e19899bf5ce22544a30dcbd322ac6", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 2248, "upload_time": "2017-10-28T14:48:05", "url": "https://files.pythonhosted.org/packages/4e/6c/cf8b761f13811f6ba52ff41cd74730a1219c26c7b44130db5770c23cd5f5/pdtransform-0.2.tar.gz" } ] }, "urls": [ { "comment_text": "", "digests": { "md5": "55b032f24af3eb172a8ab2bcc23093b0", "sha256": "88359e9649cc7d530b209731b97c3120d2d303f3f122e1593e94bdbe5468dfdc" }, "downloads": -1, "filename": "pdtransform-0.2-py2.py3-none-any.whl", "has_sig": false, "md5_digest": "55b032f24af3eb172a8ab2bcc23093b0", "packagetype": "bdist_wheel", "python_version": "3.6", "requires_python": null, "size": 3813, "upload_time": "2017-10-28T14:48:07", "url": "https://files.pythonhosted.org/packages/76/37/87df6568d24234b9d258d7a93bd549b01ef7572987dfa50a44c1c7466575/pdtransform-0.2-py2.py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "6a3e19899bf5ce22544a30dcbd322ac6", "sha256": "1ae101f7bfdaead85269b1dec5fd796f054bec491910a6d0430504645c44c628" }, "downloads": -1, "filename": "pdtransform-0.2.tar.gz", "has_sig": false, "md5_digest": "6a3e19899bf5ce22544a30dcbd322ac6", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 2248, "upload_time": "2017-10-28T14:48:05", "url": "https://files.pythonhosted.org/packages/4e/6c/cf8b761f13811f6ba52ff41cd74730a1219c26c7b44130db5770c23cd5f5/pdtransform-0.2.tar.gz" } ] }