@@ -20,11 +20,16 @@
         html = BaseScraper.read(self, self.url)
         self.soup = BeautifulSoup(html)

     def getPhones(self):
         phone_prices = []
+        if self.url.find('Cameras') !=-1 :
+            ulTagClass = 'srch_result landscape'
+        else :
+            ulTagClass = 'srch_result portrait'
+
-        for li in self.soup.findAll('ul', {'class': 'srch_result portrait'})[0]('li'):
+        for li in self.soup.findAll('ul', {'class': ulTagClass})[0]('li'):

             name = li.find('span', {'class': 'title'}).contents[1].strip()
             try:
                 price = li.find('div', {'class': 'price'}).find('span', {'class': 'normal'}).string
             except IndexError:
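A side note on the lookup in the for line above: in BeautifulSoup, calling a tag is shorthand for findAll, so ul('li') returns the li elements under that ul. A minimal sketch of that behaviour, assuming the BeautifulSoup 3 API that the findAll calls here suggest:

    from BeautifulSoup import BeautifulSoup  # BeautifulSoup 3 import (an assumption)

    html = '<ul class="srch_result portrait"><li>Phone A</li><li>Phone B</li></ul>'
    soup = BeautifulSoup(html)
    ul = soup.findAll('ul', {'class': 'srch_result portrait'})[0]
    # Calling the tag is equivalent to ul.findAll('li'); this is what the
    # "[0]('li')" expression in getPhones relies on.
    print(ul('li'))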
@@ -60,11 +65,13 @@
     def getNextUrl(self):
         b = self.soup.findAll('div', {'class': 'resultsSummary'})[0].findAll('b')
         current_max = int(b[0].string.split('-')[1])
         total_products = int(b[1].string)

+        urlDivider = self.url.find('page=')
+
-        return 'http://www.infibeam.com/Mobiles/search?page=%d' % (1 + current_max / 20) if current_max < total_products else None
+        return self.url[:urlDivider] + 'page=%d' % (1 + current_max / 20) if current_max < total_products else None

     def getDataFromProductPage(self, url):
         html = BaseScraper.read(self, url)
         soup = BeautifulSoup(html)
         name = soup.find('div', {'id': 'ib_details'}).find('h1', {'class': "fn"}).find('span', {'class': "item"}).string.strip()