Extract emails and LinkedIn profiles from a given website
Support the project with BTC: bc1q0cxl5j3se0ufhr96h8x0zs8nz4t7h6krrxkd6l
- Python >= 3.7
pip install extract_emails
from extract_emails.browsers.requests_browser import RequestsBrowser as Browser
from extract_emails import DefaultFilterAndEmailFactory as Factory
from extract_emails import DefaultWorker
browser = Browser()
url = 'https://en.wikipedia.org/'
factory = Factory(website_url=url, browser=browser)
worker = DefaultWorker(factory)
data = worker.get_data()
print(data)
"""
[
PageData(
website='https://en.wikipedia.org/',
page_url='https://en.wikipedia.org/Email_address',
data={'email': ['"John.Doe."@example.com', 'x@example.com']}
),
PageData(
website='https://en.wikipedia.org/',
page_url='https://en.wikipedia.org/Email_address2',
data={'email': ['"John.Doe2."@example.com', 'x2@example.com']}
),
]
"""
$ extract-emails --help
$ extract-emails --url https://en.wikipedia.org/wiki/Email -of output.csv -d 1
$ cat output.csv
email,page,website
bob@b.org,https://en.wikipedia.org/wiki/Email,https://en.wikipedia.org/wiki/Email