{ "info": { "author": "Max Woolf", "author_email": "max@minimaxir.com", "bugtrack_url": null, "classifiers": [], "description": "\nGive an input CSV file and a target field you want to predict to automl-gs, and get a trained high-performing machine learning or deep learning model plus native code pipelines allowing you to integrate that model into any prediction workflow. No black box: you can see *exactly* how the data is processed, how the model is constructed, and you can make tweaks as necessary.\n\nautoml-gs is an AutoML tool which, unlike Microsoft's [NNI](https://github.com/Microsoft/nni), Uber's [Ludwig](https://github.com/uber/ludwig), and [TPOT](https://github.com/EpistasisLab/tpot), offers a *zero code/model definition interface* to getting an optimized model and data transformation pipeline in multiple popular ML/DL frameworks, with minimal Python dependencies (pandas + scikit-learn + your framework of choice). automl-gs is designed for citizen data scientists and engineers without a deep statistical background under the philosophy that you don't need to know any modern data preprocessing and machine learning engineering techniques to create a powerful prediction workflow.\n\nNowadays, the cost of computing many different models and hyperparameters is much lower than the oppertunity cost of an data scientist's time. automl-gs is a Python 3 module designed to abstract away the common approaches to transforming tabular data, architecting machine learning/deep learning models, and performing random hyperparameter searches to identify the best-performing model. This allows data scientists and researchers to better utilize their time on model performance optimization.\n\n* Generates native Python code; no platform lock-in, and no need to use automl-gs after the model script is created.\n* Train model configurations super-fast *for free* using a **TPU** in Google Colaboratory.\n* Handles messy datasets that normally require manual intervention, such as datetime/categorical encoding and spaced/parathesized column names.\n* Each part of the generated model pipeline is its own function w/ docstrings, making it much easier to integrate into production workflows.\n* Extremely detailed metrics reporting for every trial stored in a tidy CSV, allowing you to identify and visualize model strengths and weaknesses.\n* Correct serialization of data pipeline encoders on disk (i.e. no pickled Python objects!)\n* Retrain the generated model on new data without making any code/pipeline changes.\n* Quit the hyperparameter search at any time, as the results are saved after each trial.\n\nThe models generated by automl-gs are intended to give a very strong *baseline* for solving a given problem; they're not the end-all-be-all that often accompanies the AutoML hype, but the resulting code is easily tweakable to improve from the baseline.\n", "description_content_type": "", "docs_url": null, "download_url": "", "downloads": { "last_day": -1, "last_month": -1, "last_week": -1 }, "home_page": "https://github.com/minimaxir/automl-gs", "keywords": "deep learning", "license": "MIT", "maintainer": "", "maintainer_email": "", "name": "automl_gs", "package_url": "https://pypi.org/project/automl_gs/", "platform": "", "project_url": "https://pypi.org/project/automl_gs/", "project_urls": { "Homepage": "https://github.com/minimaxir/automl-gs" }, "release_url": "https://pypi.org/project/automl_gs/0.2.1/", "requires_dist": null, "requires_python": "", "summary": "Provide an input CSV and a target field to predict, generate a model + code to run it.", "version": "0.2.1" }, "last_serial": 5102314, "releases": { "0.2": [ { "comment_text": "", "digests": { "md5": "cb298b4568b03f980ba952e18d206954", "sha256": "a74d44bba154462ce510884ee58adf93d0de665433535cbf30890dddd6096c0b" }, "downloads": -1, "filename": "automl_gs-0.2.tar.gz", "has_sig": false, "md5_digest": "cb298b4568b03f980ba952e18d206954", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 26894, "upload_time": "2019-03-26T05:44:54", "url": "https://files.pythonhosted.org/packages/8f/21/da79be042ce5ac74ec6e056ac2b3715365beef2958a8ca420b2b89e58fb6/automl_gs-0.2.tar.gz" } ], "0.2.1": [ { "comment_text": "", "digests": { "md5": "ba9089591bd731e72be16dbfc5382673", "sha256": "51c4b68e5bdda99fa42643a382760da765118daf44bbddb6b344317c5fa36c3a" }, "downloads": -1, "filename": "automl_gs-0.2.1.tar.gz", "has_sig": false, "md5_digest": "ba9089591bd731e72be16dbfc5382673", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 27236, "upload_time": "2019-04-05T06:47:54", "url": "https://files.pythonhosted.org/packages/c4/51/27833a08fe4f83711b09836ddd9128e275a6900c47e0e5782112ed611484/automl_gs-0.2.1.tar.gz" } ] }, "urls": [ { "comment_text": "", "digests": { "md5": "ba9089591bd731e72be16dbfc5382673", "sha256": "51c4b68e5bdda99fa42643a382760da765118daf44bbddb6b344317c5fa36c3a" }, "downloads": -1, "filename": "automl_gs-0.2.1.tar.gz", "has_sig": false, "md5_digest": "ba9089591bd731e72be16dbfc5382673", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 27236, "upload_time": "2019-04-05T06:47:54", "url": "https://files.pythonhosted.org/packages/c4/51/27833a08fe4f83711b09836ddd9128e275a6900c47e0e5782112ed611484/automl_gs-0.2.1.tar.gz" } ] }