Subversion Repositories SmartDukaan

Rev

Rev 20361 | Details | Compare with Previous | Last modification | View Log | RSS feed

Rev Author Line No. Line
13828 kshitij.so 1
import pymongo
20347 kshitij.so 2
from dtr.utils.utils import to_java_date, DEAL_PRIORITY
13914 kshitij.so 3
from datetime import datetime, timedelta
14256 kshitij.so 4
import optparse
14325 kshitij.so 5
from dtr.storage.MemCache import MemCache
14705 kshitij.so 6
from dtr.utils.utils import getCashBack
20311 kshitij.so 7
from shop2020.model.v1.catalog.script import AmazonAsyncScraper
20347 kshitij.so 8
import traceback
13828 kshitij.so 9
 
20311 kshitij.so 10
 
13828 kshitij.so 11
# Shared MongoDB client; stays None until get_mongo_connection() creates it.
con = None

# Command line: -m / --m selects the host, defaulting to "localhost".
parser = optparse.OptionParser()
parser.add_option(
    "-m", "--m",
    dest="mongoHost",
    default="localhost",
    type="string",
    help="The HOST where the mongo server is running",
    metavar="mongo_host"
)
# NOTE: arguments are parsed as a side effect of loading this module.
options, args = parser.parse_args()

# Cache client, constructed with the same host option.
mc = MemCache(options.mongoHost)

# NOTE(review): the three literals below look like live API credentials
# committed to source control -- presumably access key, secret key and
# seller id; confirm against AmazonAsyncScraper.Products. They should be
# rotated and loaded from configuration or the environment instead.
amScraper = AmazonAsyncScraper.Products(
    "AKIAII3SGRXBJDPCHSGQ",
    "B92xTbNBTYygbGs98w01nFQUhbec1pNCkCsKVfpg",
    "AF6E3O0VE0X4D"
)
# Marketplace id passed to every pricing lookup in scrapeAmazon().
marketplaceId = 'A21TJRUUN4KGV'

# Store name -> numeric source_id used in the Catalog collections.
SOURCE_MAP = {
    'AMAZON': 1,
    'FLIPKART': 2,
    'SNAPDEAL': 3,
    'SAHOLIC': 4,
    'SHOPCLUES.COM': 5,
    'PAYTM.COM': 6,
}
16019 kshitij.so 26
 
14256 kshitij.so 27
def get_mongo_connection(host=options.mongoHost, port=27017):
    """Return the shared MongoClient, creating it on the first call.

    The client is stored in the module-level ``con`` and reused by every
    later call; ``host`` and ``port`` are only consulted when no client
    exists yet.

    host -- server to connect to. The default is read from
            ``options.mongoHost`` once, when this function is defined.
    port -- TCP port, 27017 by default.

    Returns the client, or None when constructing it raised (the exception
    is printed, not propagated).
    """
    global con
    if con is None:
        print("Establishing connection %s host and port %d" % (host, port))
        try:
            con = pymongo.MongoClient(host, port)
        except Exception as e:
            # "except X as e" is valid on Python 2.6+ and 3, and matches the
            # form already used in getNetPriceForItem.
            print(e)
            return None
    return con
37
 
19185 kshitij.so 38
def getNetPriceForItem(itemId, source_id, category_id, price):
    """Return ``price`` after subtracting the item's cash back, if any.

    The cash back record comes from ``getCashBack``. It is applied only when
    its ``cash_back_status`` is 1 and its ``cash_back_type`` is 1 or 2:

    * type 1 -- ``cash_back`` is a percentage of ``price``
    * type 2 -- ``cash_back`` is a flat amount

    When the record carries ``maxCashBack``, a percentage offer worth more
    than the cap is converted to a flat offer of the cap, and a flat offer
    above the cap is reduced to it.

    This is best effort: if the lookup or any conversion raises, the
    traceback is printed and ``price`` is returned unchanged.
    """
    cash_back_type = 0
    cash_back = 0
    try:
        cashBack = getCashBack(itemId, source_id, category_id, mc, options.mongoHost)
        if cashBack and cashBack.get('cash_back_status') == 1:
            # Work on local copies so the record handed back by getCashBack
            # (which may be shared or cached) is never modified.
            offerType = cashBack['cash_back_type']
            if offerType in (1, 2):
                offerValue = cashBack['cash_back']
                cap = cashBack.get('maxCashBack')
                if cap is not None:
                    if offerType == 1 and (float(offerValue) * price) / 100 > cap:
                        # Percentage is worth more than the cap: flat cap.
                        offerType, offerValue = 2, cap
                    elif offerType == 2 and offerValue > cap:
                        offerValue = cap
                offerValue = float(offerValue)
                # Commit both values together so a failed conversion cannot
                # leave a type set without its amount.
                cash_back_type, cash_back = offerType, offerValue
    except Exception:
        # Still fall back to the plain price, but leave a trace instead of
        # hiding the failure.
        traceback.print_exc()

    if cash_back_type == 1:
        return price - cash_back * price / 100
    if cash_back_type == 2:
        return price - cash_back
    return price
73
 
14147 kshitij.so 74
def populate():
    """Collect the Amazon listings worth re-pricing and scrape them in batches.

    Listings come from three places, keyed by MasterData ``_id``:

    1. source_id 1 listings that share a ``skuBundleId`` with any MasterData
       document whose ``rank`` is greater than 0;
    2. source_id 1 entries in Deals with ``showDeal`` 1 and ``totalPoints``
       above -100;
    3. source_id 1 ManualDeals whose start/end window contains the current
       time. These set ``dealFlag`` to 1 and copy ``dealType`` and
       ``dealUrl`` from the manual deal, overriding the zero/empty defaults
       given to the first two groups.

    Listings whose ``identifier`` is not exactly 10 characters after
    stripping are skipped. The rest are passed to ``scrapeAmazon`` in groups
    of at most 20, keyed by upper-cased identifier.
    """
    # NOTE(review): 20 is presumably the per-request ASIN limit of the
    # pricing API -- confirm before changing it.
    batchSize = 20
    db = get_mongo_connection().Catalog
    toScrapMap = {}

    # 1. Amazon listings of every ranked bundle.
    for bestSeller in list(db.MasterData.find({'rank': {'$gt': 0}})):
        amazonListings = list(db.MasterData.find(
            {'skuBundleId': bestSeller['skuBundleId'], 'source_id': 1}))
        for data in amazonListings:
            if data['_id'] not in toScrapMap:
                data['dealFlag'] = 0
                data['dealType'] = 0
                data['dealUrl'] = ""
                toScrapMap[data['_id']] = data

    # 2. Amazon deals that are currently shown.
    dealFlagged = list(db.Deals.find(
        {'source_id': 1, 'showDeal': 1, 'totalPoints': {'$gt': -100}}))
    for deal in dealFlagged:
        if deal['_id'] in toScrapMap:
            continue
        data = db.MasterData.find_one({'_id': deal['_id']})
        if data is None:
            # A deal without a MasterData document used to raise IndexError
            # here and abort the whole run; skip it instead.
            continue
        data['dealFlag'] = 0
        data['dealType'] = 0
        data['dealUrl'] = ""
        toScrapMap[deal['_id']] = data

    # 3. Manual deals active right now.
    now = to_java_date(datetime.now())
    manualDeals = list(db.ManualDeals.find(
        {'startDate': {'$lte': now}, 'endDate': {'$gte': now}, 'source_id': 1}))
    for manualDeal in manualDeals:
        sku = manualDeal['sku']
        data = toScrapMap.get(sku)
        if data is None:
            data = db.MasterData.find_one({'_id': sku})
            if data is None:
                continue
            toScrapMap[sku] = data
        data['dealFlag'] = 1
        data['dealType'] = manualDeal['dealType']
        data['dealUrl'] = manualDeal['dealUrl']

    batch = {}
    for v in toScrapMap.values():
        print(v)
        # Lets validate identifier
        asin = str(v['identifier']).strip()
        if len(asin) != 10:
            continue
        batch[asin.upper()] = v
        # Count distinct keys, not iterations: two identifiers that
        # normalise to the same ASIN occupy a single slot.
        if len(batch) == batchSize:
            scrapeAmazon(batch)
            batch = {}
    if batch:
        # The trailing partial batch was previously dropped, so up to 19
        # listings per run were never refreshed.
        scrapeAmazon(batch)
14147 kshitij.so 121
 
122
 
20311 kshitij.so 123
def scrapeAmazon(dataMap):
    """Refresh price and stock for one batch of Amazon listings.

    dataMap -- dict mapping an ASIN string to its MasterData document. Each
               document must already carry ``dealType``, as populate() sets.

    One call to ``amScraper.get_competitive_pricing_for_asin`` prices the
    whole batch. For each listing:

    * it is skipped when its identifier is empty, when ``ignorePricing`` is
      1, or when ``priceUpdatedOn`` is within the last five minutes;
    * a price above 0 marks the item in stock and is written to
      ``available_price`` in both MasterData and Deals; otherwise the item
      is marked out of stock and the stored price is left alone;
    * ``netPriceAfterCashBack`` is recomputed and stored on the deal;
    * ``recomputeDeal`` is run for the listing's bundle, and a failure there
      is reported without stopping the batch.
    """
    asinPricingMap = amScraper.get_competitive_pricing_for_asin(marketplaceId, list(dataMap))
    print("asinPricingMap  %s" % (asinPricingMap,))
    db = get_mongo_connection().Catalog
    amazonSourceId = SOURCE_MAP.get('AMAZON')

    for asin, data in dataMap.items():
        print(str(data['identifier']))
        # Skipping must only affect this listing. The original used
        # "return" here, which silently dropped the rest of the batch.
        if data['identifier'] is None or len(data['identifier'].strip()) == 0:
            continue

        if data.get('ignorePricing') == 1:
            print("Ignored items returning for %d" % (data['_id']))
            continue

        try:
            cutoff = to_java_date(datetime.now() - timedelta(minutes=5))
            recentlyUpdated = data['priceUpdatedOn'] > cutoff
        except Exception:
            # No usable timestamp (e.g. never priced): treat as stale.
            recentlyUpdated = False
        if recentlyUpdated:
            print("sku id is already updated %s" % (data['_id'],))
            continue

        lowestPrice = asinPricingMap.get(asin)
        print(lowestPrice)
        # Explicit None check: "None > 0" is merely False on Python 2 and a
        # TypeError on Python 3.
        hasPrice = lowestPrice is not None and lowestPrice > 0
        inStock = 1 if hasPrice else 0
        if hasPrice:
            priceForCashBack = lowestPrice
        else:
            priceForCashBack = data['available_price']
        netPriceAfterCashBack = getNetPriceForItem(
            data['_id'], amazonSourceId, data['category_id'], priceForCashBack)

        print(lowestPrice)
        print(inStock)

        now = to_java_date(datetime.now())
        masterFields = {'updatedOn': now, 'priceUpdatedOn': now, 'in_stock': inStock}
        if hasPrice:
            masterFields['available_price'] = lowestPrice
        db.MasterData.update({'_id': data['_id']}, {'$set': masterFields}, multi=True)

        dealFields = {
            'in_stock': inStock,
            'dealType': data['dealType'],
            'codAvailable': data['codAvailable'],
            'netPriceAfterCashBack': netPriceAfterCashBack,
        }
        if hasPrice:
            dealFields['available_price'] = lowestPrice
        db.Deals.update({'_id': data['_id']}, {'$set': dealFields}, multi=True)

        try:
            recomputeDeal(data)
        except Exception:
            # Keep going with the rest of the batch, but show the cause.
            traceback.print_exc()
            print("Unable to compute deal for  %s" % (data['skuBundleId'],))
164
 
14325 kshitij.so 165
def populateNegativeDeals():
    """Cache the distinct ``sku`` values of Catalog.NegativeDeals.

    The list is stored through ``mc`` under the key "negative_deals"; 600 is
    passed as the third argument to ``mc.set`` (presumably a lifetime in
    seconds -- confirm against MemCache).
    """
    negativeDealsCollection = get_mongo_connection().Catalog.NegativeDeals
    blockedSkus = negativeDealsCollection.find().distinct('sku')
    mc.set("negative_deals", blockedSkus, 600)
13828 kshitij.so 168
 
16501 kshitij.so 169
#def recomputePoints(item, deal):
170
#    try:
171
#        if item.get('available_price') == deal['available_price']:
172
#            print "No need to compute points for %d , as price is still same" %(item['_id'])
173
#            raise
174
#        nlcPoints = getNlcPoints(item, deal['minNlc'], deal['maxNlc'], deal['available_price'])
175
#    except:
176
#        traceback.print_exc()
177
#        nlcPoints = deal['nlcPoints']
178
#    
179
#    bundleDealPoints = list(get_mongo_connection().Catalog.DealPoints.find({'skuBundleId':item['skuBundleId'],'startDate':{'$lte':to_java_date(datetime.now())},'endDate':{'$gte':to_java_date(datetime.now())}}))
180
#    if len(bundleDealPoints) > 0:
181
#        item['manualDealThresholdPrice'] = bundleDealPoints[0]['dealThresholdPrice']
182
#        dealPoints = bundleDealPoints[0]['dealPoints']
183
#    else:
184
#        dealPoints = 0
185
#        item['manualDealThresholdPrice'] = None
186
#    
187
#    get_mongo_connection().Catalog.Deals.update({'_id':deal['_id']},{"$set":{'totalPoints':deal['totalPoints'] - deal['nlcPoints'] + nlcPoints - deal['dealPoints'] +dealPoints , 'nlcPoints': nlcPoints, 'dealPoints': dealPoints, 'manualDealThresholdPrice': item['manualDealThresholdPrice']}})
15267 kshitij.so 188
 
189
 
190
 
191
def _getNegativeDeals():
    """Return the negative-deal skus, refreshing the cache when it is empty."""
    negativeDeals = mc.get("negative_deals")
    if negativeDeals is None:
        populateNegativeDeals()
        negativeDeals = mc.get("negative_deals")
    if negativeDeals is None:
        # Cache still empty after a refresh: read the collection directly
        # rather than failing on "x in None".
        negativeDeals = get_mongo_connection().Catalog.NegativeDeals.find().distinct('sku')
    return negativeDeals


def _beatsIncumbent(candidate, incumbent, incumbentPrice):
    """Tell whether ``candidate`` should replace ``incumbent`` as best deal.

    A strictly lower ``netPriceAfterCashBack`` always wins. On an equal price
    the candidate wins unless its source sits later in DEAL_PRIORITY than
    the incumbent's. If the priority lookup itself fails, the traceback is
    printed and the candidate wins.
    """
    price = candidate.get('netPriceAfterCashBack')
    if price < incumbentPrice:
        return True
    if price != incumbentPrice:
        return False
    try:
        if (DEAL_PRIORITY.index(int(candidate['source_id'])) >
                DEAL_PRIORITY.index(int(incumbent['source_id']))):
            return False
    except Exception:
        traceback.print_exc()
    return True


def recomputeDeal(item):
    """Lets recompute deal for this bundle.

    item -- document carrying the ``skuBundleId`` whose deals are re-ranked.

    Every Deals entry of the bundle is examined. Entries that are out of
    stock, listed as negative deals, or are SHOPCLUES.COM entries with rank
    0 are hidden (``showDeal`` 0, ``prepaidDeal`` 0). Among the rest, the
    best ``netPriceAfterCashBack`` is picked separately for entries with
    ``codAvailable`` equal to 1 and for all others ("prepaid"):

    * the best COD entry gets ``showDeal`` 1;
    * the best prepaid entry gets ``prepaidDeal`` 1, but only when there is
      no COD winner or it is strictly cheaper than the COD winner;
    * every other entry of the bundle is hidden.

    When no entry qualifies in either group, nothing beyond the per-entry
    hiding above is written.
    """
    print("Recomputing for bundleId %d" % (item.get('skuBundleId')))
    skuBundleId = item['skuBundleId']

    deals = get_mongo_connection().Catalog.Deals
    similarItems = list(deals.find({'skuBundleId': skuBundleId}).sort(
        [('netPriceAfterCashBack', pymongo.ASCENDING)]))
    if not similarItems:
        return

    # Read the cache once per bundle, not twice per entry. This also removes
    # the window in which the cached list could expire between the None
    # check and the membership test.
    negativeDeals = _getNegativeDeals()
    shopcluesId = SOURCE_MAP.get('SHOPCLUES.COM')

    bestPrice = float("inf")
    bestOne = None
    prepaidBestPrice = float("inf")
    prepaidBestOne = None

    # NOTE(review): on Python 2 a missing netPriceAfterCashBack (None)
    # compares below every number, so such an entry would be picked as the
    # cheapest -- confirm whether that can occur in Deals.
    for similarItem in similarItems:
        isCod = similarItem['codAvailable'] == 1
        excluded = (
            similarItem['in_stock'] == 0
            or similarItem['_id'] in negativeDeals
            or (similarItem['source_id'] == shopcluesId and similarItem['rank'] == 0)
        )
        if excluded:
            deals.update({'_id': similarItem['_id']},
                         {'$set': {'showDeal': 0, 'prepaidDeal': 0}})
            continue

        if isCod:
            if _beatsIncumbent(similarItem, bestOne, bestPrice):
                bestOne = similarItem
                bestPrice = similarItem.get('netPriceAfterCashBack')
        else:
            if _beatsIncumbent(similarItem, prepaidBestOne, prepaidBestPrice):
                prepaidBestOne = similarItem
                prepaidBestPrice = similarItem.get('netPriceAfterCashBack')

    toUpdate = []
    if bestOne is not None or prepaidBestOne is not None:
        toUpdate = [similarItem['_id'] for similarItem in similarItems]

        if bestOne is not None:
            toUpdate.remove(bestOne['_id'])
            deals.update({'_id': bestOne['_id']},
                         {'$set': {'showDeal': 1, 'prepaidDeal': 0}})

        # The prepaid winner is only promoted when it actually undercuts
        # the COD winner, or when there is no COD winner at all.
        promotePrepaid = prepaidBestOne is not None and (
            bestOne is None
            or prepaidBestOne.get('netPriceAfterCashBack') < bestOne.get('netPriceAfterCashBack')
        )
        if promotePrepaid:
            toUpdate.remove(prepaidBestOne['_id'])
            deals.update({'_id': prepaidBestOne['_id']},
                         {'$set': {'showDeal': 0, 'prepaidDeal': 1}})

    if len(toUpdate) > 0:
        deals.update({'_id': {"$in": toUpdate}},
                     {'$set': {'showDeal': 0, 'prepaidDeal': 0}},
                     upsert=False, multi=True)
13914 kshitij.so 267
 
13828 kshitij.so 268
def main():
    """Script entry point: run a single populate() pass."""
    populate()


# Only run when executed as a script, not when imported.
if __name__ == '__main__':
    main()