theHarvester/discovery/trello.py

from discovery.constants import *
from parsers import myparser
import requests
import time


class search_trello:
    """Find Trello pages indexed by Google and harvest data from them.

    The search term is sent to Google restricted to ``site:trello.com``; the
    raw result pages are accumulated in ``totalresults`` and later handed to
    ``myparser.Parser`` to extract e-mails, hostnames and Trello URLs.

    Relies on ``googleUA``, ``getDelay`` and ``search`` being supplied by the
    ``discovery.constants`` star-import at the top of the file.
    """

    def __init__(self, word, limit):
        """Store the search term and paging state.

        :param word: term to search for; spaces are percent-encoded so the
            value can be appended to the query string as-is.
        :param limit: upper bound for the Google ``start`` offset; paging
            stops once ``counter`` reaches it.
        """
        self.word = word.replace(' ', '%20')
        self.results = ""  # Text of the most recent Google result page.
        self.totalresults = ""  # Concatenation of every page fetched so far.
        self.server = "www.google.com"
        self.hostname = "www.google.com"
        self.quantity = "100"
        self.limit = limit
        self.counter = 0  # Current Google ``start`` offset.

    def do_search(self):
        """Fetch one page of Google results for the current offset.

        On success the page text is stored in ``results`` and appended to
        ``totalresults``. On failure the error is printed and ``results`` is
        reset to an empty string, so the caller never inspects a stale page.
        """
        urly = (f'https://{self.server}/search?num=100&start={self.counter}'
                f'&hl=en&q=site%3Atrello.com%20{self.word}')
        headers = {'User-Agent': googleUA}
        r = None
        try:
            r = requests.get(urly, headers=headers)
            time.sleep(getDelay())
        except Exception as e:
            print(e)
        if r is None:
            # The request itself failed: there is no response to read.
            # (Previously this path crashed on the unbound name ``r``.)
            self.results = ""
            return
        self.results = r.text
        self.totalresults += self.results

    def get_emails(self):
        """Return the e-mail addresses the parser finds in ``totalresults``."""
        rawres = myparser.Parser(self.totalresults, self.word)
        return rawres.emails()

    def get_urls(self):
        """Visit every Trello URL found so far and parse the combined text.

        Each distinct URL is fetched once and its body appended to
        ``totalresults``. A URL that cannot be fetched is reported and
        skipped, so one dead link no longer discards everything else.

        :return: ``(hostnames, trello_urls)``. If parsing fails altogether an
            empty pair ``([], [])`` is returned, so callers can always unpack
            or index the result.
        """
        print('\tSearching Trello URLs.')
        try:
            rawres = myparser.Parser(self.totalresults, "trello.com")
            trello_urls = rawres.urls()
            headers = {'User-Agent': googleUA}
            visited = set()
            pages = []
            for url in trello_urls:
                if url in visited:  # Make sure visiting unique URLs.
                    continue
                visited.add(url)
                try:
                    pages.append(requests.get(url=url, headers=headers).text)
                except requests.exceptions.RequestException as e:
                    print(f'Error occurred: {e}')
            # Join once instead of growing the (large) string per page.
            self.totalresults += ''.join(pages)
            rawres = myparser.Parser(self.totalresults, self.word)
            return rawres.hostnames(), trello_urls
        except Exception as e:
            print(f'Error occurred: {e}')
            return [], []

    def process(self):
        """Page through Google results, 100 at a time, until ``limit``.

        After each page ``search(self.results)`` is consulted; when it is
        truthy the pause before the next request is five times longer.
        NOTE(review): ``search`` presumably detects Google's rate-limit /
        block page -- confirm against ``discovery.constants``.
        """
        while self.counter < self.limit:
            self.do_search()
            if search(self.results):
                time.sleep(getDelay() * 5)
            else:
                time.sleep(getDelay())
            self.counter += 100
            print(f'\tSearching {self.counter} results.')
Major tidy up of code to make certain things pep8 compliant and put parsers in to there own directory to tidy up the root tree 2018-12-28 08:49:56 +08:00			`from discovery.constants import *`
Cosmetic, comments, and alphbetize. 2019-01-11 10:09:47 +08:00			`from parsers import myparser`
			`import requests`
Major tidy up of code to make certain things pep8 compliant and put parsers in to there own directory to tidy up the root tree 2018-12-28 08:49:56 +08:00			`import time`


			`class search_trello:`

			`def __init__(self, word, limit):`
			`self.word = word.replace(' ', '%20')`
			`self.results = ""`
			`self.totalresults = ""`
			`self.server = "www.google.com"`
			`self.hostname = "www.google.com"`
			`self.quantity = "100"`
			`self.limit = limit`
			`self.counter = 0`

			`def do_search(self):`
			`try:`
			`urly = "https://" + self.server + "/search?num=100&start=" + str(`
			`self.counter) + "&hl=en&q=site%3Atrello.com%20" + self.word`
			`except Exception as e:`
			`print(e)`
			`headers = {'User-Agent': googleUA}`
			`try:`
			`r = requests.get(urly, headers=headers)`
			`time.sleep(getDelay())`
			`except Exception as e:`
			`print(e)`
			`self.results = r.text`
			`self.totalresults += self.results`

			`def get_emails(self):`
Update a lot of things to be pep8, fixed some missing engines from the all flag, introduce pytest for tests, f-stringify some things 2019-01-06 17:50:07 +08:00			`rawres = myparser.Parser(self.totalresults, self.word)`
Major tidy up of code to make certain things pep8 compliant and put parsers in to there own directory to tidy up the root tree 2018-12-28 08:49:56 +08:00			`return rawres.emails()`

			`def get_urls(self):`
Cosmetic and deleted jigsaw. 2019-01-11 15:21:45 +08:00			`print('\tSearching Trello URLs.')`
Major tidy up of code to make certain things pep8 compliant and put parsers in to there own directory to tidy up the root tree 2018-12-28 08:49:56 +08:00			`try:`
Update a lot of things to be pep8, fixed some missing engines from the all flag, introduce pytest for tests, f-stringify some things 2019-01-06 17:50:07 +08:00			`rawres = myparser.Parser(self.totalresults, "trello.com")`
Major tidy up of code to make certain things pep8 compliant and put parsers in to there own directory to tidy up the root tree 2018-12-28 08:49:56 +08:00			`trello_urls = rawres.urls()`
			`visited = set()`
			`for url in trello_urls:`
Cosmetic, comments, and alphbetize. 2019-01-11 10:09:47 +08:00			`# Iterate through Trello URLs gathered and visit them, append text to totalresults.`
			`if url not in visited: # Make sure visiting unique URLs.`
Major tidy up of code to make certain things pep8 compliant and put parsers in to there own directory to tidy up the root tree 2018-12-28 08:49:56 +08:00			`visited.add(url)`
			`self.totalresults += requests.get(url=url, headers={'User-Agent': googleUA}).text`
Update a lot of things to be pep8, fixed some missing engines from the all flag, introduce pytest for tests, f-stringify some things 2019-01-06 17:50:07 +08:00			`rawres = myparser.Parser(self.totalresults, self.word)`
Major tidy up of code to make certain things pep8 compliant and put parsers in to there own directory to tidy up the root tree 2018-12-28 08:49:56 +08:00			`return rawres.hostnames(), trello_urls`
			`except Exception as e:`
Update a lot of things to be pep8, fixed some missing engines from the all flag, introduce pytest for tests, f-stringify some things 2019-01-06 17:50:07 +08:00			`print(f'Error occurred: {e}')`
Major tidy up of code to make certain things pep8 compliant and put parsers in to there own directory to tidy up the root tree 2018-12-28 08:49:56 +08:00
			`def process(self):`
			`while self.counter < self.limit:`
			`self.do_search()`
			`if search(self.results):`
			`time.sleep(getDelay() * 5)`
			`else:`
			`time.sleep(getDelay())`
			`self.counter += 100`
Cosmetic and deleted jigsaw. 2019-01-11 15:21:45 +08:00			`print(f'\tSearching {self.counter} results.')`