import myparser import re import requests import time from discovery.constants import * class search_ask: def __init__(self, word, limit): self.word = word.replace(' ', '%20') self.results = "" self.totalresults = "" self.server = "www.ask.com" self.hostname = "www.ask.com" self.quantity = "100" self.limit = int(limit) self.counter = 0 def do_search(self): headers = { 'User-agent': getUserAgent() } url = 'http://' + self.server + '/web?q=%40' + self.word \ + "&pu=100&page=" + str(self.counter) h = requests.get(url=url, headers=headers) time.sleep(getDelay()) self.results = h.text self.totalresults += self.results def check_next(self): renext = re.compile('> Next <') nextres = renext.findall(self.results) if nextres != []: nexty = "1" else: nexty = "0" return nexty def get_people(self): rawres = myparser.parser(self.totalresults, self.word) return rawres.people_jigsaw() def process(self): while (self.counter < self.limit): self.do_search() more = self.check_next() if more == "1": self.counter += 100 else: break