{ "info": { "author": "zhaobin", "author_email": "303844828@qq.com", "bugtrack_url": null, "classifiers": [], "description": "Introduction\n------------\n\nxgboost for pyspark\n\npython3.5 spark2.4.x xgboost0.9\n\npython install\n--------------\n\npip install PyXGBoost\n\ncode examples:\n--------------\n\n.. code:: python\n\n from pyspark.sql import SparkSession\n from PyXGBoost import PyXGBoostClassifier, PyXGBoostClassificationModel\n spark = SparkSession \\\n .builder \\\n .appName(\"pyspark xgboost\") \\\n .getOrCreate()\n\n df=spark.read.csv(\"src/main/resources/iris.csv\",schema=\"sepal_length double, sepal_width double, petal_length double,petal_width double,label int\")\n df=df.fillna(0)\n #same as xgboost param map\n params0 = {\n \"objective\" :\"binary:logistic\"\n , \"eta\" : 0.01\n , \"max_depth\" : 6\n , \"min_child_weight\" : 50\n , \"colsample_bytree\" : 0.5\n , \"silent\" : 0\n , \"seed\" : 12345\n }\n\n xgb=PyXGBoostClassifier(params0)\n\n xgb.set_num_round(11) \\\n .set_num_workers(11)\n \n feature_names=[\"sepal_length\",\"sepal_width\",\"petal_length\",\"petal_width\"]\n xgbModel=xgb.train(df,feature_names, \"label\")\n xgbModel.saveOverwrite(\"hdfs://xxxx\")\n #xgbModel.write().overwrite().save(\"hdfs://xxxx\")\n xgbModel=PyXGBoostClassificationModel.load(\"hdfs://xxxx\")\n result_df=xgbModel.transform(df,feature_names)\n\ndownload jar\n------------\n\nhttps://github.com/303844828/PyXGBoost/blob/master/src/main/build/pyspark-xgboost-1.0-SNAPSHOT.jar\n\nsubmit\n------\n\n.. code:: shell\n\n spark-submit --master yarn-cluster --num-executors 100 \\\n --jars pyspark-xgboost-1.0-SNAPSHOT.jar \\\n --py-files pyspark-xgboost-1.0-SNAPSHOT.jar \\\n --files test.py\n\n\u7b80\u4ecb\n----\n\npyspark\u7248\u672c\u7684xgboost\n\n\u9996\u5148\u6267\u884c\uff1a\n----------\n\npip install PyXGBoost\n\n\u4ee3\u7801\u793a\u4f8b\uff1a\n----------\n\n.. code:: python\n\n from pyspark.sql import SparkSession\n from PyXGBoost import PyXGBoostClassifier, PyXGBoostClassificationModel\n spark = SparkSession \\\n .builder \\\n .appName(\"pyspark xgboost\") \\\n .getOrCreate()\n\n df=spark.read.csv(\"src/main/resources/iris.csv\",schema=\"sepal_length double, sepal_width double, petal_length double,petal_width double,label int\")\n df=df.fillna(0)\n #same as xgboost param map\n params0 = {\n \"objective\" :\"binary:logistic\"\n , \"eta\" : 0.01\n , \"max_depth\" : 6\n , \"min_child_weight\" : 50\n , \"colsample_bytree\" : 0.5\n , \"silent\" : 0\n , \"seed\" : 12345\n }\n\n xgb=PyXGBoostClassifier(params0)\n\n xgb.set_num_round(11) \\\n .set_num_workers(11)\n \n feature_names=[\"sepal_length\",\"sepal_width\",\"petal_length\",\"petal_width\"]\n xgbModel=xgb.train(df,feature_names, \"label\")\n xgbModel.saveOverwrite(\"hdfs://xxxx\")\n #xgbModel.write().overwrite().save(\"hdfs://xxxx\")\n xgbModel=PyXGBoostClassificationModel.load(\"hdfs://xxxx\")\n result_df=xgbModel.transform(df,feature_names)\n\n\u63d0\u4ea4\n----\n\n\u547d\u4ee4\u9700\u8981\u5728\u4e24\u4e2a\u5730\u65b9\u5e26\u4e0ajar\u5305\uff0c\u793a\u4f8b\uff1a\n\n.. code:: shell\n\n spark-submit --master yarn-cluster --num-executors 100 \\\n --jars pyspark-xgboost-1.0-SNAPSHOT.jar \\\n --py-files pyspark-xgboost-1.0-SNAPSHOT.jar \\\n --files test.py", "description_content_type": "", "docs_url": null, "download_url": "", "downloads": { "last_day": -1, "last_month": -1, "last_week": -1 }, "home_page": "", "keywords": "", "license": "", "maintainer": "", "maintainer_email": "", "name": "PyXGBoost", "package_url": "https://pypi.org/project/PyXGBoost/", "platform": "", "project_url": "https://pypi.org/project/PyXGBoost/", "project_urls": null, "release_url": "https://pypi.org/project/PyXGBoost/1.0.9/", "requires_dist": null, "requires_python": "", "summary": "pyXgboost,github:https://github.com/303844828/PyXGBoost.git", "version": "1.0.9", "yanked": false, "yanked_reason": null }, "last_serial": 6010162, "releases": { "1.0": [ { "comment_text": "", "digests": { "md5": "2446017c5b06e792402e2de79f4db5da", "sha256": "7222e338a81d6beb87adfac0b08ed80f80c709d8ff85a8c002c59e428cbbffcd" }, "downloads": -1, "filename": "PyXGBoost-1.0.tar.gz", "has_sig": false, "md5_digest": "2446017c5b06e792402e2de79f4db5da", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 1723, "upload_time": "2019-10-21T06:08:00", "upload_time_iso_8601": "2019-10-21T06:08:00.890437Z", "url": "https://files.pythonhosted.org/packages/20/4d/72ea2ad735dff0afb071b77a2a4dd85b9eca57b868d26a2a33c4b79b6294/PyXGBoost-1.0.tar.gz", "yanked": false, "yanked_reason": null } ], "1.0.1": [ { "comment_text": "", "digests": { "md5": "d440c7a5a1f10beeb8f7f0a0393be13f", "sha256": "ff8dfcba4968aa352b01c44d4f89dfa963e3664c340a18f57eb2b2581ec2b1fb" }, "downloads": -1, "filename": "PyXGBoost-1.0.1.tar.gz", "has_sig": false, "md5_digest": "d440c7a5a1f10beeb8f7f0a0393be13f", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 1752, "upload_time": "2019-10-21T09:21:43", "upload_time_iso_8601": "2019-10-21T09:21:43.843057Z", "url": "https://files.pythonhosted.org/packages/86/b2/cf27a6cf10305d19cf031c1c7141bff82139deca0a709e46ab0b561c4efd/PyXGBoost-1.0.1.tar.gz", "yanked": false, "yanked_reason": null } ], "1.0.3": [ { "comment_text": "", "digests": { "md5": "f674169579612ee30d12034b59da4a3b", "sha256": "f78dca4856688ecb28bb0d2a67fc54a2d1f0f5abe903d2606f989955df9fdefc" }, "downloads": -1, "filename": "PyXGBoost-1.0.3.tar.gz", "has_sig": false, "md5_digest": "f674169579612ee30d12034b59da4a3b", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 2830, "upload_time": "2019-10-21T09:40:39", "upload_time_iso_8601": "2019-10-21T09:40:39.669809Z", "url": "https://files.pythonhosted.org/packages/99/5a/068695ce07b0b1fac3a249db533d060de99367f6915e6e5bfb684b5d4da6/PyXGBoost-1.0.3.tar.gz", "yanked": false, "yanked_reason": null } ], "1.0.5": [ { "comment_text": "", "digests": { "md5": "eeb7fd56c546f718eaf70ecee63d2a6e", "sha256": "dfc35bf64c70ca543bdad37a0c3aa4d3109bf50ade494e7166e12ed0a4a25afc" }, "downloads": -1, "filename": "PyXGBoost-1.0.5.tar.gz", "has_sig": false, "md5_digest": "eeb7fd56c546f718eaf70ecee63d2a6e", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 2846, "upload_time": "2019-10-21T14:38:57", "upload_time_iso_8601": "2019-10-21T14:38:57.513682Z", "url": "https://files.pythonhosted.org/packages/0a/4b/448b2315586cd47c372d46bf04e56929a9a4c936fc4979fad448360b454a/PyXGBoost-1.0.5.tar.gz", "yanked": false, "yanked_reason": null } ], "1.0.6": [ { "comment_text": "", "digests": { "md5": "a7593c699bdfa22cbd688baf0774072c", "sha256": "c22d5aee4112ea9d2dffd76058284baae7d1c3c33d95142361062d005fa5a892" }, "downloads": -1, "filename": "PyXGBoost-1.0.6.tar.gz", "has_sig": false, "md5_digest": "a7593c699bdfa22cbd688baf0774072c", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 2843, "upload_time": "2019-10-21T14:43:09", "upload_time_iso_8601": "2019-10-21T14:43:09.324983Z", "url": "https://files.pythonhosted.org/packages/66/64/5687e98766d3159f35cd522bfdd3cfbc87e8a8075d6ce6230062886891fb/PyXGBoost-1.0.6.tar.gz", "yanked": false, "yanked_reason": null } ], "1.0.7": [ { "comment_text": "", "digests": { "md5": "2a112e46f9bc32fe9f7921e0dda5b8fe", "sha256": "577e834726d132b8e4879a6afcb29d9cde8b35705e24746a5af0a9c89ab919db" }, "downloads": -1, "filename": "PyXGBoost-1.0.7.tar.gz", "has_sig": false, "md5_digest": "2a112e46f9bc32fe9f7921e0dda5b8fe", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 2844, "upload_time": "2019-10-21T14:44:14", "upload_time_iso_8601": "2019-10-21T14:44:14.382643Z", "url": "https://files.pythonhosted.org/packages/56/0d/b757f119cef7e6f7b45b419b6677df3a329ca2b80de7916eb593b175d9bb/PyXGBoost-1.0.7.tar.gz", "yanked": false, "yanked_reason": null } ], "1.0.9": [ { "comment_text": "", "digests": { "md5": "707bb115dba130322888969f09492d35", "sha256": "6dae7802cd9c9e10685b83be9c873edcf8c698957da029c7a306c1d0f2901d5c" }, "downloads": -1, "filename": "PyXGBoost-1.0.9.tar.gz", "has_sig": false, "md5_digest": "707bb115dba130322888969f09492d35", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 2874, "upload_time": "2019-10-22T02:18:48", "upload_time_iso_8601": "2019-10-22T02:18:48.523374Z", "url": "https://files.pythonhosted.org/packages/1e/8b/74902abb027a6ffb43a7483ed803d7ab8438497e6df9012ccca8a42b942f/PyXGBoost-1.0.9.tar.gz", "yanked": false, "yanked_reason": null } ] }, "urls": [ { "comment_text": "", "digests": { "md5": "707bb115dba130322888969f09492d35", "sha256": "6dae7802cd9c9e10685b83be9c873edcf8c698957da029c7a306c1d0f2901d5c" }, "downloads": -1, "filename": "PyXGBoost-1.0.9.tar.gz", "has_sig": false, "md5_digest": "707bb115dba130322888969f09492d35", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 2874, "upload_time": "2019-10-22T02:18:48", "upload_time_iso_8601": "2019-10-22T02:18:48.523374Z", "url": "https://files.pythonhosted.org/packages/1e/8b/74902abb027a6ffb43a7483ed803d7ab8438497e6df9012ccca8a42b942f/PyXGBoost-1.0.9.tar.gz", "yanked": false, "yanked_reason": null } ], "vulnerabilities": [] }