####################################################
Python Module for Scraping Email Addresses from HTML
####################################################
The `email_scraper` module provides a simple function that extracts email addresses from HTML. It can find emails
in plain text, links, `atob()` obfuscation, and HTML entity obfuscation.
Available on PyPI_.
.. _PyPI: https://pypi.org/pypi/email-scraper/
.. image:: https://github.com/kichik/email-scraper/workflows/Build/badge.svg
   :target: https://github.com/kichik/email-scraper/actions
.. image:: https://badge.fury.io/py/email-scraper.svg
   :target: https://badge.fury.io/py/email-scraper
Usage
-----
>>> from email_scraper import scrape_emails
>>> scrape_emails('<html><body><a href="mailto:hello@world.com">email me</a></body></html>')
{'hello@world.com'}
>>> scrape_emails('<a href="javascript:window.location.href=atob(\'bWFpbHRvOmVtYWlsQGV4YW1wbGUuY29t\')">E-Mail</a>')
{'email@example.com'}
Raw data
{
"_id": null,
"home_page": "https://github.com/kichik/email-scraper",
"name": "email-scraper",
"maintainer": "",
"docs_url": null,
"requires_python": "",
"maintainer_email": "",
"keywords": "email scraping web obfuscate",
"author": "Amir Szekely",
"author_email": "kichik@gmail.com",
"download_url": "https://files.pythonhosted.org/packages/71/f3/78e745c325dcb4a46042ed91a9305b560dbb0c63ca171823d99e25306c99/email-scraper-0.5.tar.gz",
"platform": null,
"description": "####################################################\nPython Module for Scraping Email Addresses from HTML\n####################################################\n\nThe `email_scraper` module provides a simple method that extracts email addresses from HTML. It is able to find emails\nin plain text, links, `atob()` obfuscation and HTML entities obfuscation.\n\nAvailable on PyPI_.\n\n.. _PyPI: https://pypi.org/pypi/email-scraper/\n\n.. image:: https://github.com/kichik/email-scraper/workflows/Build/badge.svg\n :target: https://github.com/kichik/email-scraper/actions\n\n.. image:: https://badge.fury.io/py/email-scraper.svg\n :target: https://badge.fury.io/py/email-scraper\n\nUsage\n-----\n\n >>> from email_scraper import scrape_emails\n >>> scrape_emails('<html><body><a href=\"mailto:hello@world.com\">email me</a></body></html>')\n {'hello@world.com'}\n >>> scarpe_emails('<a href=\"javascript:window.location.href=atob(\\'bWFpbHRvOmVtYWlsQGV4YW1wbGUuY29t\\')\">E-Mail</a>')\n {'email@example.com'}\n\n\n",
"bugtrack_url": null,
"license": "MIT",
"summary": "Simple utility to extract email addresses from HTML, including obfuscated email addresses",
"version": "0.5",
"project_urls": {
"Homepage": "https://github.com/kichik/email-scraper"
},
"split_keywords": [
"email",
"scraping",
"web",
"obfuscate"
],
"urls": [
{
"comment_text": "",
"digests": {
"blake2b_256": "78d6efbffc6c90423f1e36cd5d73a4bb2f3575b049a8cb98cc7ae2d26422c111",
"md5": "18c43e27cb19493424597451b124c6e0",
"sha256": "a479f210e460795ef5405f31abfc42a1282297ff3816a021ce63b72f432949ce"
},
"downloads": -1,
"filename": "email_scraper-0.5-py2.py3-none-any.whl",
"has_sig": false,
"md5_digest": "18c43e27cb19493424597451b124c6e0",
"packagetype": "bdist_wheel",
"python_version": "py2.py3",
"requires_python": null,
"size": 4023,
"upload_time": "2024-02-29T03:29:41",
"upload_time_iso_8601": "2024-02-29T03:29:41.799062Z",
"url": "https://files.pythonhosted.org/packages/78/d6/efbffc6c90423f1e36cd5d73a4bb2f3575b049a8cb98cc7ae2d26422c111/email_scraper-0.5-py2.py3-none-any.whl",
"yanked": false,
"yanked_reason": null
},
{
"comment_text": "",
"digests": {
"blake2b_256": "71f378e745c325dcb4a46042ed91a9305b560dbb0c63ca171823d99e25306c99",
"md5": "602909738a6195ae14bd2b5fc83f5e18",
"sha256": "7633268c22a98f3419d19626fa3f086b14bd990f8ba3449ad8cd8ebd1853617a"
},
"downloads": -1,
"filename": "email-scraper-0.5.tar.gz",
"has_sig": false,
"md5_digest": "602909738a6195ae14bd2b5fc83f5e18",
"packagetype": "sdist",
"python_version": "source",
"requires_python": null,
"size": 2791,
"upload_time": "2024-02-29T03:29:43",
"upload_time_iso_8601": "2024-02-29T03:29:43.282649Z",
"url": "https://files.pythonhosted.org/packages/71/f3/78e745c325dcb4a46042ed91a9305b560dbb0c63ca171823d99e25306c99/email-scraper-0.5.tar.gz",
"yanked": false,
"yanked_reason": null
}
],
"upload_time": "2024-02-29 03:29:43",
"github": true,
"gitlab": false,
"bitbucket": false,
"codeberg": false,
"github_user": "kichik",
"github_project": "email-scraper",
"travis_ci": false,
"coveralls": false,
"github_actions": true,
"lcname": "email-scraper"
}