-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathmain.py
26 lines (21 loc) · 775 Bytes
/
main.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
from src.company_info_downloader import download_info_companies, read_companies_info
from src.crawler import write_json_from_data
# Crawl targets keyed by company name. Each value is a two-item list:
# a full URL followed by a path fragment that also occurs in that URL.
# NOTE(review): presumably the start page and the link filter consumed by
# download_info_companies -- confirm against that function.
companiesWebsites = dict(
    SIEMENS=[
        "https://www.siemens-energy.com/us/en/home/products-services.html",
        "/products-services/",
    ],
    HITACHI=[
        "https://www.hitachienergy.com/products-and-solutions/",
        "/products-and-solutions/",
    ],
)
if __name__ == "__main__":
    # Path of the JSON file; passed to the writer and then to the reader.
    output_path = "companies_info.json"

    # Gather the per-company information for every configured website.
    scraped = download_info_companies(
        companiesWebsites=companiesWebsites,
        numPagesToDownload=500,
        method="functional",
    )
    write_json_from_data(scraped, output_path)

    # Exercise read_companies_info on the same path as a quick check; the
    # loaded value is bound but not used any further by this script.
    reloaded = read_companies_info(output_path)