#!/usr/bin/env python3
# theHarvester/theHarvester.py
# NOTE: the wildcard imports stay first and in their original order: they may
# export names that the explicit imports below are expected to override.
from discovery import *
from discovery.constants import *
from lib.core import *
from lib import hostchecker
from lib import htmlExport
from lib import reportgraph
from lib import statichtmlgenerator
import datetime
import getopt
import os
import re
import stash
import sys
import time
from xml.sax.saxutils import escape
# Fail early, with a readable message, when a required third-party library is
# missing. SystemExit is raised directly so this path does not depend on `sys`
# happening to be re-exported by one of the wildcard imports above.
try:
    import bs4
except ImportError:
    print("\n\033[93m[!] BeautifulSoup library not found, please install before proceeding.\n\n \033[0m")
    raise SystemExit(1)

try:
    import requests
except ImportError:
    print("\n\033[93m[!] Requests library not found, please install before proceeding.\n\n \033[0m")
    raise SystemExit(1)

# The banner is printed at import time, before any argument handling.
Core.banner()
# Display name of every source that has a search backend in this file.
# 'vhost' is accepted by -b but has no backend, so it is deliberately absent.
_ENGINE_TITLES = {
    'baidu': 'Baidu',
    'bing': 'Bing',
    'bingapi': 'Bing',
    'censys': 'Censys',
    'crtsh': 'CRT.sh',
    'cymon': 'Cymon',
    'dogpile': 'Dogpile',
    'duckduckgo': 'DuckDuckGo',
    'google': 'Google',
    'googleCSE': 'Google Custom Search',
    'google-certificates': 'Google Certificate transparency report',
    'google-profiles': 'Google profiles',
    'hunter': 'Hunter',
    'linkedin': 'Linkedin',
    'netcraft': 'Netcraft',
    'pgp': 'PGP key server',
    'securityTrails': 'SecurityTrails',
    'threatcrowd': 'Threatcrowd',
    'trello': 'Trello',
    'twitter': 'Twitter',
    'virustotal': 'VirusTotal',
    'yahoo': 'Yahoo',
}

# Every value accepted by the -b option.
_SUPPORTED_ENGINES = frozenset(_ENGINE_TITLES) | {'vhost', 'all'}

# Sources whose banner is printed in colour when they are selected by name
# (inside "-b all" every banner is plain).
_COLOURED_BANNERS = frozenset([
    'baidu', 'bing', 'bingapi', 'censys', 'crtsh', 'cymon', 'dogpile',
    'duckduckgo', 'google', 'googleCSE', 'google-certificates'])

# Sources run by "-b all", in execution order.
_ALL_MODE_ENGINES = (
    'baidu', 'bing', 'censys', 'crtsh', 'duckduckgo', 'google',
    'google-certificates', 'google-profiles', 'hunter', 'netcraft', 'pgp',
    'threatcrowd', 'trello', 'twitter', 'virustotal', 'yahoo')

# Database source label where it differs from the engine name.
_DB_LABELS = {
    'bingapi': 'bing',
    'crtsh': 'CRTsh',
    'google-profiles': 'google-profile',
}

# Heading and underline printed above the names found by people-only sources.
_PEOPLE_HEADINGS = {
    'google-profiles': ("\nUsers from Google profiles:", "---------------------------"),
    'linkedin': ("\nUsers from Linkedin:", "-------------------"),
    'twitter': ("\nUsers from Twitter:", "-------------------"),
}


def _store(word, values, kind, source):
    """Persist *values* of type *kind* for *word*, attributed to *source*."""
    stash.stash_manager().store_all(word, values, kind, source)


def _emails_and_hosts(search):
    """Collect the raw e-mail and hostname results of a processed search."""
    return {'emails': search.get_emails(), 'hosts': search.get_hostnames()}


def _query_engine(engine, word, limit, offset, google_dorking):
    """Run one source and return its raw, unfiltered findings.

    :param engine: a key of ``_ENGINE_TITLES``.
    :param word: the target given with -d.
    :param limit: result limit given with -l.
    :param offset: start offset given with -s.
    :param google_dorking: whether -g was given (only used by 'google').
    :return: dict holding any of the keys 'emails', 'hosts', 'ips',
        'people' and 'urls', depending on what the source provides.
    """
    if engine == 'baidu':
        search = baidusearch.SearchBaidu(word, limit)
        search.process()
        return _emails_and_hosts(search)
    if engine in ('bing', 'bingapi'):
        search = bingsearch.SearchBing(word, limit, offset)
        search.process('yes' if engine == 'bingapi' else 'no')
        return _emails_and_hosts(search)
    if engine == 'censys':
        from discovery import censys  # Import locally or won't work.
        search = censys.SearchCensys(word, limit)
        search.process()
        return {'ips': search.get_ipaddresses(), 'hosts': search.get_hostnames()}
    if engine == 'crtsh':
        search = crtsh.search_crtsh(word)
        search.process()
        return {'hosts': search.get_hostnames()}
    if engine == 'cymon':
        from discovery import cymon  # Import locally or won't work.
        search = cymon.search_cymon(word)
        search.process()
        return {'ips': search.get_ipaddresses()}
    if engine == 'dogpile':
        search = dogpilesearch.SearchDogpile(word, limit)
        search.process()
        return _emails_and_hosts(search)
    if engine == 'duckduckgo':
        from discovery import duckduckgosearch
        search = duckduckgosearch.SearchDuckDuckGo(word, limit)
        search.process()
        return _emails_and_hosts(search)
    if engine == 'google':
        search = googlesearch.search_google(word, limit, offset)
        search.process(google_dorking)
        return _emails_and_hosts(search)
    if engine == 'googleCSE':
        search = googleCSE.SearchGoogleCSE(word, limit, offset)
        search.process()
        search.store_results()
        return _emails_and_hosts(search)
    if engine == 'google-certificates':
        search = googlecertificates.SearchGoogleCertificates(word, limit, offset)
        search.process()
        return {'hosts': search.get_domains()}
    if engine == 'google-profiles':
        search = googlesearch.search_google(word, limit, offset)
        search.process_profiles()
        return {'people': search.get_profiles()}
    if engine == 'hunter':
        from discovery import huntersearch  # Import locally or won't work.
        search = huntersearch.SearchHunter(word, limit, offset)
        search.process()
        return _emails_and_hosts(search)
    if engine == 'linkedin':
        search = linkedinsearch.SearchLinkedin(word, limit)
        search.process()
        return {'people': search.get_people()}
    if engine == 'netcraft':
        search = netcraft.SearchNetcraft(word)
        search.process()
        return {'hosts': search.get_hostnames()}
    if engine == 'pgp':
        search = pgpsearch.SearchPgp(word)
        search.process()
        return _emails_and_hosts(search)
    if engine == 'securityTrails':
        from discovery import securitytrailssearch
        search = securitytrailssearch.search_securitytrail(word)
        search.process()
        return {'hosts': search.get_hostnames(), 'ips': search.get_ips()}
    if engine == 'threatcrowd':
        search = threatcrowd.search_threatcrowd(word)
        search.process()
        return {'hosts': search.get_hostnames()}
    if engine == 'trello':
        from discovery import trello  # Import locally or won't work.
        search = trello.search_trello(word, limit)
        search.process()
        emails = search.get_emails()
        info = search.get_urls()  # info[0]: hosts, info[1]: Trello URLs
        return {'emails': emails, 'hosts': info[0], 'urls': info[1]}
    if engine == 'twitter':
        search = twittersearch.search_twitter(word, limit)
        search.process()
        return {'people': search.get_people()}
    if engine == 'virustotal':
        search = virustotal.search_virustotal(word)
        search.process()
        return {'hosts': search.get_hostnames()}
    if engine == 'yahoo':
        search = yahoosearch.search_yahoo(word, limit)
        search.process()
        return {'hosts': search.get_hostnames(), 'emails': search.get_emails()}
    return {}


def _run_engine(engine, word, limit, offset, google_dorking, totals, all_mode=False):
    """Query one source, store its findings and merge them into *totals*.

    Only the findings of this source are stored under its label, and results
    are always appended to *totals* rather than replacing earlier ones.

    A failing source prints a warning and is skipped so the remaining sources
    still run. A missing googleCSE API key terminates the program, as before.

    :param totals: dict with list entries 'emails', 'hosts', 'ips' and a
        'trello' entry holding ``(urls, searched)``; updated in place.
    :param all_mode: True when running as part of "-b all": banners are plain
        and people-only sources do not terminate the program.
    """
    title = _ENGINE_TITLES.get(engine)
    if title is None:
        # e.g. 'vhost': a valid -b value with no search backend.
        return
    if all_mode or engine not in _COLOURED_BANNERS:
        print(f"[*] Searching {title}.")
    else:
        print(f"\033[94m[*] Searching {title}. \033[0m")
    source = _DB_LABELS.get(engine, engine)
    try:
        found = _query_engine(engine, word, limit, offset, google_dorking)
        if 'people' in found:
            people = found['people']
            _store(word, people, 'name', source)
            heading, rule = _PEOPLE_HEADINGS[engine]
            print(heading)
            print(rule)
            for person in people:
                print(person)
            if not all_mode:
                # A people-only source selected by name ends the run here,
                # skipping any remaining sources and the results section.
                sys.exit()
            return
        # NOTE(review): `filter` is called with a single argument, so it must
        # be a project helper supplied by the wildcard imports rather than the
        # builtin - presumably from discovery.constants; confirm.
        if 'emails' in found:
            emails = list(filter(found['emails']))
            totals['emails'].extend(emails)
            _store(word, emails, 'email', source)
        if 'hosts' in found:
            hosts = list(filter(found['hosts']))
            totals['hosts'].extend(hosts)
            _store(word, hosts, 'host', source)
        if 'ips' in found:
            ips = list(dict.fromkeys(found['ips'] or []))  # drop duplicates
            totals['ips'].extend(ips)
            _store(word, ips, 'ip', source)
        if 'urls' in found:
            totals['trello'] = (found['urls'], True)
    except MissingKey as e:
        print(e)
        if engine == 'googleCSE':
            sys.exit(1)
    except Exception as e:
        print(f"\033[93m[!] {title} search failed: {e} \033[0m")


def _scan_ports(full):
    """Port-scan every resolved "hostname:ip" entry and check for takeovers."""
    print("\n\n\033[1;32;40m[*] Scanning ports (active).\n")
    ports = [21, 22, 80, 443, 8080]
    for entry in full:
        fields = entry.split(':')
        domain, address = fields[0], fields[1]
        if address == "empty":
            continue
        print(("[*] Scanning " + address))
        try:
            openports = port_scanner.PortScan(address, ports).process()
            if len(openports) > 0:
                print(("\t\033[91m Detected open ports: " + ','.join(
                    str(port) for port in openports) + "\033[1;32;40m"))
                takeover.take_over(domain).process()
        except Exception as e:
            print(e)


def _reverse_lookup(word, host_ip, full):
    """Reverse-resolve the /24 of every known IP; return names matching *word*.

    Matching names that are new are also appended to *full*.
    """
    print("\n[*] Starting active queries.")
    dnsrev = []
    analyzed_ranges = set()
    for address in host_ip:
        print(address)
        octets = address.split(":")[0].split(".")
        octets[3] = "0/24"
        cidr = ".".join(octets)
        if cidr in analyzed_ranges:
            continue
        print(("\033[94m[*] Performing reverse lookup in " + cidr + "\033[1;33;40m"))
        lookup = dnssearch.dns_reverse(cidr, True)
        lookup.list()
        names = lookup.process()
        analyzed_ranges.add(cidr)
        for name in names:
            if name.count(word):
                dnsrev.append(name)
                if name not in full:
                    full.append(name)
    print("Hosts found after reverse lookup (in target domain):")
    print("----------------------------------------------------")
    for name in dnsrev:
        print(name)
    return dnsrev


def _virtual_hosts(host_ip, limit, offset, full):
    """Look up virtual hosts for every IP; return sorted "ip:hostname" items.

    Each hit is also appended to *full* as "hostname:ip", the layout used by
    every other entry of that list.
    """
    print("\n[*] Virtual hosts:")
    print("------------------")
    tag_residue = re.compile(r'[[\<\/?]*[\w]*>]*')
    vhost = []
    for address in host_ip:
        search = bingsearch.SearchBing(address, limit, offset)
        search.process_vhost()
        for name in search.get_allhostnames():
            name = tag_residue.sub('', name)
            name = name.replace('<', '').replace('>', '')
            print((address + "\t" + name))
            vhost.append(address + ":" + name)
            full.append(name + ":" + address)
    return sorted(set(vhost))


def _shodan_lookup(host_ip):
    """Query Shodan for every IP and print the results as a table."""
    import texttable  # only needed when -h is given
    tab = texttable.Texttable()
    tab.header(["IP address", "Hostname", "Org", "Services:Ports", "Technologies"])
    tab.set_cols_align(["c", "c", "c", "c", "c"])
    tab.set_cols_valign(["m", "m", "m", "m", "m"])
    tab.set_chars(['-', '|', '+', '#'])
    tab.set_cols_width([15, 20, 15, 15, 18])
    print("\n\n\033[1;32;40m[*] Shodan DB search (passive):\n")
    try:
        for ip in host_ip:
            print(("\tSearching for: " + ip))
            rowdata = shodansearch.search_shodan().search_ip(ip)
            time.sleep(2)  # pause between consecutive Shodan queries
            tab.add_row(rowdata)
        printedtable = tab.draw()
        print("\n [*] Shodan results:")
        print("-------------------")
        print(printedtable)
    except Exception as e:
        print(f'Error occurred in theHarvester - Shodan search module: {e}')


def _write_html_reports(word, filename, all_emails, full, vhost, dnsres,
                        dnsrev, shodanres, dnstldres):
    """Write the database-backed report.html and the classic HTML export."""
    try:
        print("NEW REPORTING BEGINS.")
        db = stash.stash_manager()
        scanboarddata = db.getscanboarddata()
        latestscanresults = db.getlatestscanresults(word)
        previousscanresults = db.getlatestscanresults(word, previousday=True)
        latestscanchartdata = db.latestscanchartdata(word)
        scanhistorydomain = db.getscanhistorydomain(word)
        pluginscanstatistics = db.getpluginscanstatistics()
        generator = statichtmlgenerator.htmlgenerator(word)
        graph = reportgraph.graphgenerator(word)
        html_code = generator.beginhtml()
        html_code += generator.generatelatestscanresults(latestscanresults)
        html_code += generator.generatepreviousscanresults(previousscanresults)
        html_code += graph.drawlatestscangraph(word, latestscanchartdata)
        html_code += graph.drawscattergraphscanhistory(word, scanhistorydomain)
        html_code += generator.generatepluginscanstatistics(pluginscanstatistics)
        html_code += generator.generatedashboardcode(scanboarddata)
        html_code += '<p><span style="color: #000000;">Report generated on ' + str(
            datetime.datetime.now()) + '</span></p>'
        html_code += '\n</body>\n</html>\n'
        with open("report.html", "w") as html_file:
            html_file.write(html_code)
        print("NEW REPORTING FINISHED!")
        print("[+] Saving files.")
        htmlExport.htmlExport(all_emails, full, vhost, dnsres, dnsrev,
                              filename, word, shodanres, dnstldres).writehtml()
    except Exception as e:
        print(e)
        print("Error creating the file.")


def _write_xml_report(filename, all_emails, full, vhost, shodanres):
    """Write the findings as XML next to *filename* (extension set to .xml).

    Text content is XML-escaped. Entries of *full* are "hostname:ip"; entries
    of *vhost* are "ip:hostname".
    """
    try:
        xml_path = os.path.splitext(filename)[0] + ".xml"
        parts = ['<?xml version="1.0" encoding="UTF-8"?><theHarvester>']
        for email in all_emails:
            parts.append('<email>' + escape(email) + '</email>')
        for entry in full:
            fields = entry.split(":")
            if len(fields) == 2:
                parts.append('<host><ip>' + escape(fields[1]) + '</ip><hostname>'
                             + escape(fields[0]) + '</hostname></host>')
            else:
                parts.append('<host>' + escape(entry) + '</host>')
        for entry in vhost:
            fields = entry.split(":")
            if len(fields) == 2:
                parts.append('<vhost><ip>' + escape(fields[0]) + '</ip><hostname>'
                             + escape(fields[1]) + '</hostname></vhost>')
            else:
                parts.append('<vhost>' + escape(entry) + '</vhost>')
        if shodanres:
            reg_server = re.compile('Server:.*')
            shodanalysis = []
            for item in shodanres:
                res = item.split("SAPO")
                parts.append('<shodan>')
                parts.append('<host>' + escape(res[0]) + '</host>')
                parts.append('<port>' + escape(res[2]) + '</port>')
                parts.append('<banner><!--' + res[1] + '--></banner>')
                servers = reg_server.findall(res[1])
                if servers:
                    shodanalysis.append(res[0] + ":" + servers[0])
                parts.append('</shodan>')
            if shodanalysis:
                parts.append('<servers>')
                for server in sorted(set(shodanalysis)):
                    parts.append('<server>' + escape(server) + '</server>')
                parts.append('</servers>')
        parts.append('</theHarvester>')
        # The XML declaration promises UTF-8, so write UTF-8 explicitly.
        with open(xml_path, 'w', encoding='utf-8') as xml_file:
            xml_file.write(''.join(parts))
        print("Files saved!")
    except Exception as er:
        print(f'Error saving XML file: {er}')


def start(argv):
    """Parse the command line, run the selected sources and report findings.

    Options (getopt string "l:d:b:s:u:vf:nhcgpte:"):
      -d WORD   target to search for (required)
      -b LIST   comma-separated sources, or "all"
      -l N      result limit (default 500)
      -s N      start offset (default 0)
      -f FILE   write HTML and XML reports
      -e HOST   DNS server for brute force / TLD expansion
      -g        use Google dorking        -v  virtual host lookup
      -n        DNS reverse lookup        -c  DNS brute force
      -t        DNS TLD expansion         -p  port scanning
      -h        Shodan lookup             -u  accepted, ignored

    All options are parsed before any source runs, so their order on the
    command line does not matter.

    :param argv: command-line arguments without the program name.
    :raises SystemExit: always; with status 1 on usage errors.
    """
    if len(argv) < 3:
        Core.usage()
        sys.exit(1)
    try:
        opts, _unused = getopt.getopt(argv, "l:d:b:s:u:vf:nhcgpte:")
    except getopt.GetoptError:
        Core.usage()
        sys.exit(1)
    try:
        stash.stash_manager().do_init()
    except Exception:
        # Deliberately best-effort. NOTE(review): presumably this also raises
        # when the database is already initialised - confirm before surfacing.
        pass

    word = None
    engines = []
    start_offset = 0
    limit = 500
    filename = ""
    dnsserver = ""
    dnslookup = dnsbrute = dnstld = False
    use_shodan = virtual = ports_scanning = google_dorking = False
    try:
        for opt, arg in opts:
            if opt == '-l':
                limit = int(arg)
            elif opt == '-d':
                word = arg
            elif opt == '-g':
                google_dorking = True
            elif opt == '-s':
                start_offset = int(arg)
            elif opt == '-v':
                virtual = True
            elif opt == '-f':
                filename = arg
            elif opt == '-n':
                dnslookup = True
            elif opt == '-c':
                dnsbrute = True
            elif opt == '-h':
                use_shodan = True
            elif opt == '-e':
                dnsserver = arg
            elif opt == '-p':
                ports_scanning = True
            elif opt == '-t':
                dnstld = True
            elif opt == '-b':
                engines.extend(arg.split(','))
    except ValueError:
        # Non-numeric value for -l or -s.
        Core.usage()
        sys.exit(1)
    if word is None:
        Core.usage()
        sys.exit(1)

    # Harvesting
    totals = {'emails': [], 'hosts': [], 'ips': [], 'trello': ([], False)}
    engines = list(dict.fromkeys(engines))  # de-duplicate, keep user order
    if engines:
        if not set(engines).issubset(_SUPPORTED_ENGINES):
            print("\033[93m[!] Invalid source.\n\n \033[0m")
            sys.exit(1)
        print(f"\033[94m[*] Target domain: {word} \n \033[0m")
        for engine in engines:
            if engine == "all":
                print(("Full harvest on " + word))
                for member in _ALL_MODE_ENGINES:
                    _run_engine(member, word, limit, start_offset,
                                google_dorking, totals, all_mode=True)
            else:
                _run_engine(engine, word, limit, start_offset,
                            google_dorking, totals)

    # Results (totals refer to the de-duplicated lists that are printed)
    all_ip = sorted(set(totals['ips']))
    all_emails = sorted(set(totals['emails']))
    all_hosts = sorted(set(totals['hosts']))
    host_ip = []
    full = []
    if not all_ip:
        print("No IP addresses found.")
    else:
        print("\033[1;33;40m \n[*] IP addresses found:")
        print("-----------------------")
        print("Total IP addresses: " + str(len(all_ip)) + "\n")
        for ip in all_ip:
            print(ip)
    print("\n[+] Emails found:")
    print("-----------------")
    if not all_emails:
        print("No emails found.")
    else:
        print("Total emails: " + str(len(all_emails)) + "\n")
        print("\n".join(all_emails))
    print("\033[1;33;40m \n[+] Hosts found:")
    print("----------------")
    if not all_hosts:
        print("No hosts found.")
    else:
        print(("Total hosts: " + str(len(all_hosts)) + "\n"))
        for host in all_hosts:
            print(host)
        print("\033[94m \n[*] Resolving hostnames to IPs.\033[1;33;40m")
        print("-------------------------------")
        full = hostchecker.Checker(all_hosts).check()
        for entry in full:
            ip = entry.split(':')[1]
            print(entry)
            if ip != "empty" and ip.lower() not in host_ip:
                host_ip.append(ip.lower())
        _store(word, host_ip, 'ip', 'DNS-resolver')

    trello_urls, trello_searched = totals['trello']
    if trello_searched:
        print("\033[1;33;40m \n[*] URLs found from Trello:")
        print("--------------------------")
        if not trello_urls:
            print('\nNo Trello URLs found.')
        else:
            unique_urls = sorted(set(trello_urls))
            print(("\nTotal URLs: " + str(len(unique_urls)) + "\n"))
            for url in unique_urls:
                print(url)

    # DNS brute force
    dnsres = []
    if dnsbrute:
        print("\n\033[94m[*] Starting DNS brute force. \033[1;33;40m")
        res = dnssearch.dns_force(word, dnsserver, verbose=True).process()
        print("\n\033[94m[*] Hosts found after DNS brute force:")
        print("-------------------------------------")
        for entry in res:
            print(entry)
            dnsres.append(entry.split(':')[0])
            if entry not in full:
                full.append(entry)
        _store(word, dnsres, 'host', 'dns_bruteforce')

    # Port scanning
    if ports_scanning:
        _scan_ports(full)

    # DNS reverse lookup
    dnsrev = _reverse_lookup(word, host_ip, full) if dnslookup else []

    # DNS TLD expansion
    dnstldres = []
    if dnstld:
        print("[*] Starting DNS TLD expansion.")
        res = dnssearch.dns_tld(word, dnsserver, verbose=True).process()
        print("\n[*] Hosts found after DNS TLD expansion:")
        print("----------------------------------------")
        for entry in res:
            print(entry)
            dnstldres.append(entry)
            if entry not in full:
                full.append(entry)

    # Virtual hosts search
    vhost = _virtual_hosts(host_ip, limit, start_offset, full) if virtual else []

    # Shodan
    shodanres = []  # never populated here; still handed to the report writers
    if use_shodan:
        _shodan_lookup(host_ip)

    # TODO: add explosion mode (recursive search on the virtual hosts found);
    # the TLDs have to be taken out first.

    # Reporting
    if filename != "":
        _write_html_reports(word, filename, all_emails, full, vhost, dnsres,
                            dnsrev, shodanres, dnstldres)
        _write_xml_report(filename, all_emails, full, vhost, shodanres)
    sys.exit()
# Script entry point: run the harvester on the command-line arguments.
if __name__ == "__main__":
    try:
        start(sys.argv[1:])
    except KeyboardInterrupt:
        print("\n\n\033[93m[!] ctrl+c detected from user, quitting.\n\n \033[0m")
    except Exception:
        import traceback
        # print_exc() writes the traceback itself and returns None, so its
        # result must not be passed to print().
        traceback.print_exc()
        sys.exit(1)