Subversion Repositories SmartDukaan

Rev

Rev 19592 | Go to most recent revision | Details | Compare with Previous | Last modification | View Log | RSS feed

Rev Author Line No. Line
19495 kshitij.so 1
from elixir import *
2
from dtr.storage.DataService import FlipkartOrders
3
from dtr.storage import DataService
4
from dtr.utils.utils import get_mongo_connection, get_mongo_connection_dtr_data, \
5
to_java_date, to_py_date
6
from cassandra.cluster import Cluster
7
import optparse
8
from datetime import datetime, timedelta, time
9
 
10
parser = optparse.OptionParser()
11
parser.add_option("-H", "--host", dest="hostname",
12
                      default="localhost",
13
                      type="string", help="The HOST where the DB server is running",
14
                      metavar="host")
15
parser.add_option("-m", "--m", dest="mongoHostDtr",
16
                      default="localhost",
17
                      type="string", help="Host where Catalog/Dtr dbs exist",
18
                      metavar="mongo_host")
19
parser.add_option("-d", "--d", dest="mongoHostDtrData",
20
                      default="localhost",
21
                      type="string", help="Host to dump data",
22
                      metavar="mongo_host_dtr_data")
23
 
24
parser.add_option("-c", "--c", dest="cassandraHost",
25
                      default="localhost",
26
                      type="string", help="Cassandra host",
27
                      metavar="cassandra_host")
28
 
29
(options, args) = parser.parse_args()
30
 
31
# Hosts selected on the command line (each defaults to "localhost").
dtr_host = options.mongoHostDtr
# NOTE(review): dtr_data_host is assigned here but is not referenced by any
# function visible in this file -- confirm whether it should be passed to
# get_mongo_connection_dtr_data().
dtr_data_host = options.mongoHostDtrData
db_hostname = options.hostname
cassandra_host = options.cassandraHost

# The Cassandra session is opened at import time and bound to the
# "profitmandi" keyspace; createViewsMap() runs its query through it.
cluster = Cluster([cassandra_host])
session_cassandra = cluster.connect()
session_cassandra.set_keyspace("profitmandi")

print dtr_host
print db_hostname


# Maps skuBundleId -> Analytics object; filled by createViewsMap() and
# createSalesMap(), then written out by commit().
bundleMap = {}
45
 
46
class Analytics:
    """Sales and view counters for one SKU bundle on one date.

    Instances are plain attribute holders. commit() stores each instance's
    attribute dictionary as a document, so the attribute names are also the
    stored field names.

    skuBundleId -- identifier of the bundle the counters belong to
    sales       -- quantity sold
    views       -- number of views
    date        -- value identifying the day; callers in this file pass the
                   result of to_java_date(...)
    """

    def __init__(self, skuBundleId, sales, views, date):
        # Identity of the record.
        self.skuBundleId, self.date = skuBundleId, date
        # Counters that the map-building functions increment.
        self.sales, self.views = sales, views
52
 
53
def createViewsMap():
    """Count the previous day's 'click' events per SKU bundle into bundleMap.

    The window runs from the previous local midnight (inclusive) to the most
    recent local midnight (exclusive). Each event's 'sku' property is
    resolved to a skuBundleId through Catalog.MasterData. Events whose SKU
    has no MasterData document are ignored. For every resolved event the
    bundle's Analytics.views is incremented, creating the entry with
    views=1 and sales=0 when the bundle is not in bundleMap yet.

    Returns nothing; the result is the mutation of the module-level
    bundleMap.
    """
    global bundleMap
    # date_field is today's local midnight; start is the midnight before it.
    date_field = datetime.combine(datetime.now().date(), time.min)
    start = to_java_date(date_field - timedelta(days=1))
    end = to_java_date(date_field)
    # Data stored in cassandra is in utc format.
    # NOTE(review): the bounds are pushed through utcfromtimestamp and
    # to_java_date again, presumably to shift them to UTC -- confirm against
    # to_java_date's behaviour.
    utc_start = to_java_date(datetime.utcfromtimestamp(start / 1000))
    utc_end = to_java_date(datetime.utcfromtimestamp(end / 1000))
    query = "select * from events where label='click' and time >='"+str(utc_start)+"' and time < '"+str(utc_end)+"' ALLOW FILTERING"
    print(query)
    result = session_cassandra.execute(query)

    # Resolve the collection once instead of once per event.
    master_data = get_mongo_connection(host=dtr_host).Catalog.MasterData
    # Per-run memo so each distinct SKU costs a single MasterData query.
    bundle_by_sku = {}
    unknown_skus = set()
    for event in result:
        sku = int(event.properties['sku'])
        if sku in unknown_skus:
            continue
        if sku not in bundle_by_sku:
            master = master_data.find_one({'_id': sku})
            if master is None:
                unknown_skus.add(sku)
                continue
            bundle_by_sku[sku] = master['skuBundleId']
        bundleId = bundle_by_sku[sku]
        if bundleId in bundleMap:
            obj = bundleMap[bundleId]
            obj.views = obj.views + 1
        else:
            bundleMap[bundleId] = Analytics(bundleId, 0, 1, start)
78
 
79
def _add_sales(skuBundleId, qty, date):
    """Add qty to the bundle's sales in bundleMap, creating the entry if absent."""
    if skuBundleId in bundleMap:
        obj = bundleMap[skuBundleId]
        obj.sales = obj.sales + qty
    else:
        bundleMap[skuBundleId] = Analytics(skuBundleId, qty, 0, date)


def createSalesMap():
    """Add the previous day's sold quantities per SKU bundle to bundleMap.

    Two sources are read for the window from the previous local midnight
    (inclusive) to the most recent local midnight (exclusive):

    * Dtr.merchantOrder documents (matched on 'createdOnInt'). Each sub-order
      with a productCode is resolved to a skuBundleId via Catalog.MasterData:
      store 3 is matched on 'secondaryIdentifier', every other store on
      'identifier'. Sub-orders without a matching MasterData document are
      skipped.
    * FlipkartOrders rows (matched on 'created'); catalogId is used directly
      as the skuBundleId and rows without a catalogId are skipped.

    Returns nothing; the result is the mutation of the module-level
    bundleMap. The SQL session is closed before returning, including when
    the Flipkart query or loop raises.
    """
    DataService.initialize(db_hostname=db_hostname)
    date_field = datetime.combine(datetime.now().date(), time.min)
    start = to_java_date(date_field - timedelta(days=1))
    end = to_java_date(date_field)

    # Resolve the connection and collection once instead of per sub-order.
    dtr_connection = get_mongo_connection(host=dtr_host)
    master_data = dtr_connection.Catalog.MasterData
    all_orders = dtr_connection.Dtr.merchantOrder.find({'createdOnInt': {"$gte": start/1000, "$lt": end/1000}})
    for order in all_orders:
        store = order['storeId']
        subOrders = order.get('subOrders')
        if subOrders is None:
            continue
        # Store 3 keeps the product code in a different MasterData field.
        if store != 3:
            id_field = 'identifier'
        else:
            id_field = 'secondaryIdentifier'
        for s in subOrders:
            if s.get('productCode') is None:
                continue
            productCode = str(s['productCode'])
            qty = s['quantity']
            master = master_data.find_one({id_field: productCode, 'source_id': store})
            if master is None:
                continue
            _add_sales(master.get('skuBundleId'), qty, start)

    try:
        # Lower bound is inclusive so the window is [start, end), matching the
        # Mongo query above; with a strict '>' an order stamped exactly at
        # midnight would belong to no daily run.
        fk_orders = session.query(FlipkartOrders).filter(FlipkartOrders.created >= to_py_date(start)).filter(FlipkartOrders.created < to_py_date(end)).all()
        for fk_order in fk_orders:
            if fk_order.catalogId is None:
                continue
            _add_sales(fk_order.catalogId, fk_order.quantity, start)
    finally:
        # Release the SQL session even if the query or the loop fails.
        session.close()
121
 
122
def commit():
    """Insert every Analytics record held in bundleMap into Analytics.ViewSalesData.

    Each record is written as its attribute dictionary, one insert per bundle.
    """
    # NOTE(review): get_mongo_connection_dtr_data() is called without a host,
    # while the module parses a -d option into dtr_data_host -- confirm
    # whether that host is meant to be passed here.
    for bundle_id in bundleMap:
        record = vars(bundleMap[bundle_id])
        get_mongo_connection_dtr_data().Analytics.ViewSalesData.insert(record)
125
 
19591 kshitij.so 126
def assignBestSellerRanks(category_id=6, max_rank=100, window_days=30):
    """Rank the best-selling bundles of one category in Catalog.MasterData.

    Sales stored in Analytics.ViewSalesData with a 'date' on or after local
    midnight window_days days ago are summed per skuBundleId. All existing
    positive ranks of the category are reset to 0, then bundles are visited
    in descending order of total sales and the first max_rank bundles that
    belong to the category receive ranks 1..max_rank (together with a fresh
    'updatedOn'). Bundles without a MasterData document, or whose document is
    in another category or has no category, are skipped without consuming a
    rank.

    category_id -- MasterData 'category_id' to rank (default 6)
    max_rank    -- number of ranks to hand out (default 100)
    window_days -- how many days of sales to aggregate (default 30)

    Returns nothing.
    """
    date_field = datetime.combine(datetime.now().date(), time.min)
    start = to_java_date(date_field - timedelta(days=window_days))
    # NOTE(review): called without a host although the module parses a -d
    # option into dtr_data_host -- confirm whether it should be passed.
    salesData = get_mongo_connection_dtr_data().Analytics.ViewSalesData.find({'date': {"$gte": start}}, {'skuBundleId': 1, 'sales': 1})

    # Total sales per bundle over the window.
    skuBundleRankMap = {}
    for data in salesData:
        bundleId = data['skuBundleId']
        skuBundleRankMap[bundleId] = skuBundleRankMap.get(bundleId, 0) + data['sales']
    sorted_skuBundleRankMap = sorted(skuBundleRankMap.items(), key=lambda x: x[1], reverse=True)

    # Resolve the collection once instead of once per bundle.
    master_data = get_mongo_connection(host=dtr_host).Catalog.MasterData
    # Clear the previous ranking before assigning the new one.
    master_data.update({'rank': {"$gt": 0}, 'category_id': category_id}, {"$set": {'rank': 0}}, upsert=False, multi=True)
    rank = 1
    for bundleId, _total_sales in sorted_skuBundleRankMap:
        if rank > max_rank:
            return
        master = master_data.find_one({'skuBundleId': bundleId})
        # .get() so a document lacking category_id is skipped rather than
        # aborting the run after the old ranks were already cleared.
        if master is None or master.get('category_id') != category_id:
            continue
        master_data.update({'skuBundleId': master['skuBundleId']}, {"$set": {"rank": rank, 'updatedOn': to_java_date(datetime.now())}}, upsert=False, multi=True)
        rank = rank + 1
147
 
148
 
19495 kshitij.so 149
def main():
    """Run the daily job: build views, build sales, store them, then re-rank."""
    # Order matters: both maps must be filled before commit(), and the
    # ranking reads what commit() has just stored.
    pipeline = (createViewsMap, createSalesMap, commit, assignBestSellerRanks)
    for step in pipeline:
        step()
19495 kshitij.so 154
 
155
 
156
# Run the pipeline only when this file is executed as a script.
if __name__ == '__main__':
    main()