# Rev 14325 | Rev 15270 | Go to most recent revision | Blame | Compare with Previous | Last modification | View Log | RSS feed
"""Refresh Snapdeal prices and stock flags in the Catalog Mongo database.

The script collects the Snapdeal (source_id 3) SKUs that belong to ranked
bundles or to currently shown deals, asks Snapdeal's vendor JSON endpoint for
each SKU's offers, writes price / stock back to ``Catalog.MasterData`` and
``Catalog.Deals`` and then re-elects the deal to show for the SKU's bundle.

Usage: run as a script; ``-m/--m`` selects the Mongo host (default localhost).
Written for Python 2 (``urllib2``).
"""
import optparse
import time
import urllib2
from datetime import datetime, timedelta
from multiprocessing import Pool as ThreadPool
from multiprocessing import cpu_count

import pymongo
import simplejson as json

from dtr.storage.MemCache import MemCache
from dtr.utils.utils import to_java_date

# Lazily created, process-wide Mongo client (see get_mongo_connection).
con = None

parser = optparse.OptionParser()
parser.add_option("-m", "--m", dest="mongoHost",
                  default="localhost",
                  type="string", help="The HOST where the mongo server is running",
                  metavar="mongo_host")

(options, args) = parser.parse_args()

mc = MemCache(options.mongoHost)

# Browser-like headers sent with every Snapdeal request.
headers = {
    'User-agent': 'Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/535.11 (KHTML, like Gecko) Chrome/17.0.963.56 Safari/535.11',
    'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8',
    'Accept-Language': 'en-US,en;q=0.8',
    'Accept-Charset': 'ISO-8859-1,utf-8;q=0.7,*;q=0.3',
}

# source_id value used for Snapdeal records throughout this script.
SNAPDEAL_SOURCE_ID = 3


def get_mongo_connection(host=options.mongoHost, port=27017):
    """Return the shared ``pymongo.MongoClient``, creating it on first use.

    Returns ``None`` (after printing the error) when the client cannot be
    created.
    """
    global con
    if con is None:
        print("Establishing connection %s host and port %d" % (host, port))
        try:
            con = pymongo.MongoClient(host, port)
        except Exception as e:
            print(e)
            return None
    return con


def _reset_mongo_connection():
    """Pool initializer: drop the client inherited from the parent process.

    PyMongo documents that a MongoClient must not be used across a fork, so
    every worker starts without one and opens its own on first use.
    """
    global con
    con = None


def populate():
    """Collect the Snapdeal SKUs to refresh and update them in a process pool.

    SKUs come from two places: Snapdeal MasterData rows sharing a
    ``skuBundleId`` with any ranked row (``rank > 0``), and Snapdeal deals
    that are currently shown with positive ``totalPoints``.
    """
    catalog = get_mongo_connection().Catalog
    toScrapMap = {}

    # Materialise the outer cursor first because more queries run per row.
    bestSellers = list(catalog.MasterData.find({'rank': {'$gt': 0}}))
    for bestSeller in bestSellers:
        snapdealBestSellers = catalog.MasterData.find(
            {'skuBundleId': bestSeller['skuBundleId'], 'source_id': SNAPDEAL_SOURCE_ID})
        for data in snapdealBestSellers:
            toScrapMap.setdefault(data['_id'], data)

    dealFlagged = list(catalog.Deals.find(
        {'source_id': SNAPDEAL_SOURCE_ID, 'showDeal': 1, 'totalPoints': {'$gt': 0}}))
    for deal in dealFlagged:
        if deal['_id'] in toScrapMap:
            continue
        data = catalog.MasterData.find_one({'_id': deal['_id']})
        if data is None:
            # A deal without a MasterData row used to abort the whole run
            # with IndexError; skip it instead.
            print("No MasterData found for deal %s, skipping" % (deal['_id'],))
            continue
        toScrapMap[deal['_id']] = data

    pool = ThreadPool(cpu_count() * 2, initializer=_reset_mongo_connection)
    try:
        pool.map(updatePrices, list(toScrapMap.values()))
    finally:
        # Always release the workers, even when a task raised.
        pool.close()
        pool.join()
    print("joining threads at %s" % (str(datetime.now())))


def _fetch_vendor_info(url):
    """Download ``url`` and return the decoded JSON, or ``[]`` for an empty body."""
    req = urllib2.Request(url, headers=headers)
    response = urllib2.urlopen(req)
    try:
        json_input = response.read()
    finally:
        response.close()
    if len(json_input) == 0:
        return []
    return json.loads(json_input)


def _pick_buyable_offer(vendorInfo):
    """Return ``(price, stock, instock)`` for the first buyable vendor.

    A vendor is buyable when both its ``buyableInventory`` and its
    ``sellingPrice`` are positive. The request asks for ``sort=sellingPrice``,
    so the first hit is presumably the cheapest one (not verified here).
    Returns ``(0, 0, 0)`` when no vendor qualifies.

    NOTE(review): the reviewed copy of this file had lost its indentation, so
    it is unclear which statement the original ``else:`` reset belonged to.
    Resetting to zeros when nothing is buyable yields the same database writes
    under every reading, because the price is only stored when in stock.
    """
    for vendor in vendorInfo:
        price = float(vendor['sellingPrice'])
        stock = vendor.get('buyableInventory') or 0
        if stock > 0 and price > 0:
            return price, stock, 1
    return 0, 0, 0


def updatePrices(data):
    """Refresh price and stock of one Snapdeal MasterData document.

    Does nothing for non-Snapdeal rows, rows without an identifier, or rows
    whose ``priceUpdatedOn`` is less than five minutes old. Otherwise fetches
    the vendor list, updates MasterData and Deals for ``data['_id']`` and
    recomputes the deal of ``data['skuBundleId']``.
    """
    if data['source_id'] != SNAPDEAL_SOURCE_ID:
        return
    identifier = data['identifier']
    print(identifier)
    if identifier is None or not identifier.strip():
        print("returning")
        return

    lastPriced = data.get('priceUpdatedOn')
    if lastPriced is not None and lastPriced > to_java_date(datetime.now() - timedelta(minutes=5)):
        print("sku id is already updated %s" % (data['_id'],))
        return

    url = "http://www.snapdeal.com/acors/json/gvbps?supc=%s&catId=175&sort=sellingPrice" % (identifier.strip())
    print(url)
    time.sleep(1)  # throttle requests to the remote site

    try:
        vendorInfo = _fetch_vendor_info(url)
    except Exception as e:
        # One failing request must not abort the whole pool.map run.
        print("Unable to fetch vendor info for %s: %s" % (data['_id'], e))
        return

    lowestOfferPrice, stock, instock = _pick_buyable_offer(vendorInfo)

    print(lowestOfferPrice)
    print(instock)
    print(stock)
    print("Lowest Offer Price for id %d is %d , stock is %d and stock count is %d" % (data['_id'], lowestOfferPrice, instock, stock))
    print("*************")

    now = to_java_date(datetime.now())
    masterFields = {'updatedOn': now, 'priceUpdatedOn': now, 'in_stock': instock}
    dealFields = {'in_stock': instock}
    if instock == 1:
        # The price is only overwritten when a buyable offer was found.
        masterFields['available_price'] = lowestOfferPrice
        dealFields['available_price'] = lowestOfferPrice

    catalog = get_mongo_connection().Catalog
    catalog.MasterData.update({'_id': data['_id']}, {'$set': masterFields}, multi=True)
    catalog.Deals.update({'_id': data['_id']}, {'$set': dealFields}, multi=True)

    try:
        recomputeDeal(data['skuBundleId'])
    except Exception as e:
        print("Unable to compute deal for  %s (%s)" % (data.get('skuBundleId'), e))


def populateNegativeDeals():
    """Cache the distinct ``sku`` values of Catalog.NegativeDeals for 600 (third ``mc.set`` argument)."""
    negativeDeals = get_mongo_connection().Catalog.NegativeDeals.find().distinct('sku')
    mc.set("negative_deals", negativeDeals, 600)


def _get_negative_deals():
    """Return the negative-deal skus, refreshing the cache when it is empty.

    Falls back to reading Mongo directly if the cache still returns ``None``
    after a refresh, so callers never receive ``None``.
    """
    negativeDeals = mc.get("negative_deals")
    if negativeDeals is None:
        populateNegativeDeals()
        negativeDeals = mc.get("negative_deals")
    if negativeDeals is None:
        negativeDeals = get_mongo_connection().Catalog.NegativeDeals.find().distinct('sku')
    return negativeDeals


def recomputeDeal(skuBundleId):
    """Recompute which deal of this bundle is shown.

    Items that are out of stock, have no ``maxprice``, cost more than their
    ``maxprice`` or are listed as negative deals get ``showDeal`` 0. Among the
    rest the cheapest wins, ties going to the higher ``bestSellerPoints``; the
    winner gets ``showDeal`` 1 and every other item of the bundle 0.
    """
    print("Recomputing for bundleId %s" % (skuBundleId,))

    deals = get_mongo_connection().Catalog.Deals
    similarItems = list(deals.find({'skuBundleId': skuBundleId}).sort([('available_price', pymongo.ASCENDING)]))
    if not similarItems:
        return

    # Read once per call: reading it per item could hit an expired key
    # between the None check and the membership test.
    negativeDeals = _get_negative_deals()

    bestPrice = float("inf")
    bestOne = None
    bestSellerPoints = 0
    for similarItem in similarItems:
        if (similarItem['in_stock'] == 0
                or similarItem['maxprice'] is None
                or similarItem['maxprice'] < similarItem['available_price']
                or similarItem['_id'] in negativeDeals):
            deals.update({'_id': similarItem['_id']}, {'$set': {'showDeal': 0}})
            continue
        price = similarItem['available_price']
        if price < bestPrice or (price == bestPrice and bestSellerPoints < similarItem['bestSellerPoints']):
            bestOne = similarItem
            bestPrice = price
            bestSellerPoints = similarItem['bestSellerPoints']

    if bestOne is None:
        return

    deals.update({'_id': bestOne['_id']}, {'$set': {'showDeal': 1}})
    toUpdate = [item['_id'] for item in similarItems if item['_id'] != bestOne['_id']]
    if toUpdate:
        deals.update({'_id': {"$in": toUpdate}}, {'$set': {'showDeal': 0}}, upsert=False, multi=True)


def main():
    """Script entry point."""
    populate()


if __name__ == '__main__':
    main()