pip install zacktools
or from git
pip3 install git+https://github.com/ZackAnalysis/zacktools.git
A tool for parse address,phone, email, facebook, twitter, linkedin, contact link, about us link from a webpage
from zacktools import pageparser
import requests
res = requests.get('http://rel8ed.to')
result = pageparser.parse(res.content)
print(result)
{
"facebook": "https://www.facebook.com/rel8edto/",
"twitter": "https://twitter.com/rel8edto",
"instagram": "",
"linkedin": "https://www.linkedin.com/company/rel8ed-to",
"contactlink": "http://www.rel8ed.to/contact-us/",
"aboutlink": "http://www.rel8ed.to/about-us/",
"title": "Big Data Analysis Data Mining Predictive Analytics",
"email": "[email protected]",
"phone": "905.321.0466",
"Mainaddress": "1 St. Paul St., Unit A303, St. Catharines, ON L2R 7L2",
"addresses": [
"1 St. Paul St., Unit A303, St. Catharines, ON L2R 7L2"
]
}
from zacktools.multiThread import scrapeurls
import asyncio
urls = ['ibm.com','idc.com']
asyncio.run(scrapeurls(urls))