class MySpider(Spider): def init(self, login, password): link = "http://freeerisa.benefitspro.com" self.login = login self.password = password self.cj = cookielib.CookieJar() self.opener = urllib2.build_opener( urllib2.HTTPRedirectHandler(), urllib2.HTTPHandler(debuglevel=0), urllib2.HTTPSHandler(debuglevel=0), urllib2.HTTPCookieProcessor(self.cj) ) self.loginToFreeErissa() self.loginToFreeErissa() def loginToFreeErissa(self): login_data = urllib.urlencode({ 'MainContent_mainContent_txtEmail' : self.login, 'MainContent_mainContent_txtPassword' : self.password, }) response = self.opener.open(link + "/login.aspx", login_data) return ''.join(response.readlines()) def after_login(self, response): if "Error while logging in" in response.body: self.logger.error("Login failed!") else: url = [link + "/5500/plandetails.aspx?Ein=042088633", link + "/5500/plandetails.aspx?Ein=046394579"] for u in url: g_data =soup.find_all("span") for item in g_data: return item.text
Aucun commentaire:
Enregistrer un commentaire