{ "info": { "author": "Philippe ENTZMANN", "author_email": "philippe@phec.net", "bugtrack_url": null, "classifiers": [ "License :: OSI Approved :: BSD License", "Programming Language :: Python :: 3", "Programming Language :: Python :: 3.7" ], "description": "**WARNING : DON'T EXPECT ANYTHING USEFUL FROM THIS TOOL AT THIS STAGE !!**\n\n# xlscrap\n\nxlscrap is a [BSD-3-Clause-licensed](https://opensource.org/licenses/BSD-3-Clause) package to ease Excel files mass data extraction\n\nSee the [documentation](docs/index.md).\n\n# Rationale\n\nHave you ever felt the pain of extracting data from a lot of Excel files ?\n\n* When you have hundreds or thousands of files that look similar\nbut differ in slightly annoying details.\n* When data cell coordinates can't be used because they change\n* When you have to spot dozens or hundreds of fields with different strategies.\n* When the same field moves in different sheet position or name\n* When the same field label changes\n* When the data cell is on the right of the label or below the label\n* When you need to check that the collected data is correct.\n\nxlscrap helps you to scrap data out of your Excel files.\n\n# Quickstart\n\n```python\n>>> import xlscrap\n>>> s = xlscrap.Scrapper()\n>>> s.field('name')\n>>> s.field('age')\n>>> s.field('address')\n>>> s.table('pets', fields=['name', 'breed', 'age'])\n>>> s.scrap('excel-files/*.xls*')\nlooking for 4 fields in 5 files in excel-files/*.xls*,\nfile 1/5, found 4/4 fields in diana.xlsx\nfile 2/5, found 4/4 fields in bob.xls\nfile 3/5, found 3/4 fields in richard.ods\nfile 4/5, found 0/4 fields in alien.xls\nfile 5/5, found 4/4 fields in maria.xlsm\n>>> s.result\n[\n {'name': 'Diana',\n 'age': 47,\n 'address': '44 rue du Louvre\\n75000 Paris\\nFrance',\n 'pets': []},\n ...\n]\n```\n\n# TODO\n\n* set gitlab URL in setup.py\n* clone gitlab/github\n* complete quickstart in README\n ", "description_content_type": "text/markdown", "docs_url": null, "download_url": "", "downloads": { "last_day": -1, 
"last_month": -1, "last_week": -1 }, "home_page": "", "keywords": "spreadsheet,poetry", "license": "BSD-3-Clause", "maintainer": "Philippe ENTZMANN", "maintainer_email": "philippe@phec.net", "name": "xlscrap", "package_url": "https://pypi.org/project/xlscrap/", "platform": "", "project_url": "https://pypi.org/project/xlscrap/", "project_urls": null, "release_url": "https://pypi.org/project/xlscrap/0.1.0/", "requires_dist": [ "openpyxl (>=2.6,<3.0)" ], "requires_python": ">=3.7,<4.0", "summary": "A package to ease Excel files mass data extraction", "version": "0.1.0" }, "last_serial": 5568272, "releases": { "0.1.0": [ { "comment_text": "", "digests": { "md5": "f9dada4d777f760f9abf7573c0db6b07", "sha256": "ddd808d65f5888abd0b60aa4915180e2719308ed89e5333d9131228688c27546" }, "downloads": -1, "filename": "xlscrap-0.1.0-py3-none-any.whl", "has_sig": false, "md5_digest": "f9dada4d777f760f9abf7573c0db6b07", "packagetype": "bdist_wheel", "python_version": "py3", "requires_python": ">=3.7,<4.0", "size": 3444, "upload_time": "2019-07-22T17:01:27", "url": "https://files.pythonhosted.org/packages/78/16/bcce98e1c8b34b6036c5b34221ea97b4e4dd07234513328dd8079aa65fcb/xlscrap-0.1.0-py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "0444d671b5ff3c34710fb22103f93800", "sha256": "e7160fa2160c1ca165423cbdb5f1fb73e42febf82fa85ec6f59bb169905b39c8" }, "downloads": -1, "filename": "xlscrap-0.1.0.tar.gz", "has_sig": false, "md5_digest": "0444d671b5ff3c34710fb22103f93800", "packagetype": "sdist", "python_version": "source", "requires_python": ">=3.7,<4.0", "size": 3386, "upload_time": "2019-07-22T17:01:30", "url": "https://files.pythonhosted.org/packages/fe/04/d2a62b59f7a2a2584414a80578674fc92e5a2ef1b9199a57e244c07957aa/xlscrap-0.1.0.tar.gz" } ] }, "urls": [ { "comment_text": "", "digests": { "md5": "f9dada4d777f760f9abf7573c0db6b07", "sha256": "ddd808d65f5888abd0b60aa4915180e2719308ed89e5333d9131228688c27546" }, "downloads": -1, "filename": "xlscrap-0.1.0-py3-none-any.whl", 
"has_sig": false, "md5_digest": "f9dada4d777f760f9abf7573c0db6b07", "packagetype": "bdist_wheel", "python_version": "py3", "requires_python": ">=3.7,<4.0", "size": 3444, "upload_time": "2019-07-22T17:01:27", "url": "https://files.pythonhosted.org/packages/78/16/bcce98e1c8b34b6036c5b34221ea97b4e4dd07234513328dd8079aa65fcb/xlscrap-0.1.0-py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "0444d671b5ff3c34710fb22103f93800", "sha256": "e7160fa2160c1ca165423cbdb5f1fb73e42febf82fa85ec6f59bb169905b39c8" }, "downloads": -1, "filename": "xlscrap-0.1.0.tar.gz", "has_sig": false, "md5_digest": "0444d671b5ff3c34710fb22103f93800", "packagetype": "sdist", "python_version": "source", "requires_python": ">=3.7,<4.0", "size": 3386, "upload_time": "2019-07-22T17:01:30", "url": "https://files.pythonhosted.org/packages/fe/04/d2a62b59f7a2a2584414a80578674fc92e5a2ef1b9199a57e244c07957aa/xlscrap-0.1.0.tar.gz" } ] }