Name | portia-pro JSON |
Version |
1.2.5
JSON |
| download |
home_page | https://github.com/yanjlee/portia |
Summary | Portia is a tool that allows you to visually scrape websites without any programming knowledge required. With Portia you can annotate a web page to identify the data you wish to extract, and Portia will understand based on these annotations how to scrape data from similar pages. |
upload_time | 2024-06-01 08:10:36 |
maintainer | None |
docs_url | None |
author | yanjlee |
requires_python | None |
license | None |
keywords |
|
VCS |
|
bugtrack_url |
|
requirements |
No requirements were recorded.
|
Travis-CI |
|
coveralls test coverage |
No coveralls.
|
Portia
======
Portia is a tool that allows you to visually scrape websites without any programming knowledge required. With Portia you can annotate a web page to identify the data you wish to extract, and Portia will understand based on these annotations how to scrape data from similar pages.
# Running Portia
The easiest way to run Portia is with [Docker].
You can run Portia using Docker and the official Portia image by running:

    docker run -v ~/portia_projects:/app/data/projects:rw -p 9001:9001 scrapinghub/portia

You can also set up a local instance with [Docker-compose] by cloning this repo and running the following command from the repository root:

    docker-compose up

For more detailed instructions, and alternatives to using Docker, see the [Installation] docs.
# Documentation
Documentation is available on [Read the docs]. Its source files can be found in the ``docs`` directory.
[Docker]: https://www.docker.com/
[Docker-compose]: https://docs.docker.com/compose
[Installation]: http://portia.readthedocs.org/en/latest/installation.html
[Read the docs]: http://portia.readthedocs.org/en/latest/index.html
[Scrapinghub]: https://portia.scrapinghub.com/
Raw data
{
"_id": null,
"home_page": "https://github.com/yanjlee/portia",
"name": "portia-pro",
"maintainer": null,
"docs_url": null,
"requires_python": null,
"maintainer_email": null,
"keywords": null,
"author": "yanjlee",
"author_email": "yanjlee@163.com",
"download_url": "https://files.pythonhosted.org/packages/c6/98/78fa411b2b541587b15abb909236f9f6482d7abed370c99b342135f7b621/portia_pro-1.2.5.tar.gz",
"platform": null,
"description": "Portia\r\n======\r\n\r\nPortia is a tool that allows you to visually scrape websites without any programming knowledge required. With Portia you can annotate a web page to identify the data you wish to extract, and Portia will understand based on these annotations how to scrape data from similar pages.\r\n\r\n# Running Portia\r\n\r\nThe easiest way to run Portia is using [Docker]:\r\n\r\nYou can run Portia using Docker & official Portia-image by running:\r\n\r\n docker run -v ~/portia_projects:/app/data/projects:rw -p 9001:9001 scrapinghub/portia\r\n\r\nYou can also set up a local instance with [Docker-compose] by cloning this repo & running from the root of the folder:\r\n\r\n docker-compose up\r\n\r\nFor more detailed instructions, and alternatives to using Docker, see the [Installation] docs.\r\n\r\n# Documentation\r\n\r\nDocumentation can be found from [Read the docs]. Source files can be found in the ``docs`` directory.\r\n\r\n[Docker]: https://www.docker.com/\r\n[Docker-compose]:https://docs.docker.com/compose\r\n[Installation]: http://portia.readthedocs.org/en/latest/installation.html\r\n[Read the docs]: http://portia.readthedocs.org/en/latest/index.html\r\n[Scrapinghub]: https://portia.scrapinghub.com/\r\n",
"bugtrack_url": null,
"license": null,
"summary": "Portia is a tool that allows you to visually scrape websites without any programming knowledge required. With Portia you can annotate a web page to identify the data you wish to extract, and Portia will understand based on these annotations how to scrape data from similar pages..",
"version": "1.2.5",
"project_urls": {
"Homepage": "https://github.com/yanjlee/portia"
},
"split_keywords": [],
"urls": [
{
"comment_text": "",
"digests": {
"blake2b_256": "93c78ca8ad04607dd057cc3047387f99abc4a657b3b45eda4631c7e1e0926150",
"md5": "f7a37552328ec6212cc6efcf799a1de9",
"sha256": "fdc10f5bc19e84c4c8d91757d04dfa9de1328dfb530ec022bc7fb59dd7cfd584"
},
"downloads": -1,
"filename": "portia_pro-1.2.5-py3-none-any.whl",
"has_sig": false,
"md5_digest": "f7a37552328ec6212cc6efcf799a1de9",
"packagetype": "bdist_wheel",
"python_version": "py3",
"requires_python": null,
"size": 2914,
"upload_time": "2024-06-01T08:10:34",
"upload_time_iso_8601": "2024-06-01T08:10:34.298476Z",
"url": "https://files.pythonhosted.org/packages/93/c7/8ca8ad04607dd057cc3047387f99abc4a657b3b45eda4631c7e1e0926150/portia_pro-1.2.5-py3-none-any.whl",
"yanked": false,
"yanked_reason": null
},
{
"comment_text": "",
"digests": {
"blake2b_256": "c69878fa411b2b541587b15abb909236f9f6482d7abed370c99b342135f7b621",
"md5": "b5c5fcf01286fddf517a81decc288cf6",
"sha256": "1500782358d91d1ec568a26e383708d1ce6e86359beaea7f1d8360f209e06482"
},
"downloads": -1,
"filename": "portia_pro-1.2.5.tar.gz",
"has_sig": false,
"md5_digest": "b5c5fcf01286fddf517a81decc288cf6",
"packagetype": "sdist",
"python_version": "source",
"requires_python": null,
"size": 3568,
"upload_time": "2024-06-01T08:10:36",
"upload_time_iso_8601": "2024-06-01T08:10:36.032425Z",
"url": "https://files.pythonhosted.org/packages/c6/98/78fa411b2b541587b15abb909236f9f6482d7abed370c99b342135f7b621/portia_pro-1.2.5.tar.gz",
"yanked": false,
"yanked_reason": null
}
],
"upload_time": "2024-06-01 08:10:36",
"github": true,
"gitlab": false,
"bitbucket": false,
"codeberg": false,
"github_user": "yanjlee",
"github_project": "portia",
"travis_ci": true,
"coveralls": false,
"github_actions": false,
"lcname": "portia-pro"
}