spoof-detect / python /vendor.py
Niv Sardi
vendor: add arguments
dd9165a
#!/usr/bin/env python3
import csv
import concurrent.futures
import requests
from progress.bar import ChargingBar
from entity import Entity
from common import defaults,mkdir
import screenshot
import web
PARALLEL = 20
def query_vendor_site(e: Entity):
fn = web.get_cert(e)
lfn = web.get_logos(e)
sfn = screenshot.sc_entity(e)
return (fn, lfn, sfn)
def from_csv(fn: str, n_workers = PARALLEL):
with open(fn, newline='') as csvfile:
reader = csv.DictReader(csvfile)
with concurrent.futures.ThreadPoolExecutor(max_workers = n_workers) as executor:
futures = {executor.submit(query_vendor_site, e): e for e in [Entity.from_dict(d) for d in reader]}
bar = ChargingBar('Processing', max=len(futures))
for f in concurrent.futures.as_completed(futures):
url = futures[f]
try:
(cert, logos) = f.result()
except Exception as exc:
print('%r generated an exception: %s' % (url, exc))
raise
else:
print(cert, logos)
bar.next()
bar.finish()
#query_vendor_site(Entity.from_dict({'url':'http://www.bancoprovincia.com.ar', 'bco':'debug'}))
#exit()
if __name__ == '__main__':
import argparse
parser = argparse.ArgumentParser(description='extract certificates and screenshots websites')
parser.add_argument('--csv', metavar='csv', type=str,
default=defaults.MAIN_CSV_PATH,
help='main database')
parser.add_argument('--parallel', metavar='parallel', type=int,
default=PARALLEL,
help='number of concurrent jobs')
args = parser.parse_args()
from_csv(args.csv)