Subversion Repositories SmartDukaan

Rev

Rev 19591 | Go to most recent revision | Details | Last modification | View Log | RSS feed

Rev Author Line No. Line
19495 kshitij.so 1
from elixir import *
2
from dtr.storage.DataService import FlipkartOrders
3
from dtr.storage import DataService
4
from dtr.utils.utils import get_mongo_connection, get_mongo_connection_dtr_data, \
5
to_java_date, to_py_date
6
from cassandra.cluster import Cluster
7
import optparse
8
from datetime import datetime, timedelta, time
9
 
10
# Command-line interface: four host options, all strings defaulting to
# "localhost".
parser = optparse.OptionParser()

# One row per option: (short flag, long flag, dest, help text, metavar).
_HOST_OPTIONS = (
    ("-H", "--host", "hostname",
     "The HOST where the DB server is running", "host"),
    ("-m", "--m", "mongoHostDtr",
     "Host where Catalog/Dtr dbs exist", "mongo_host"),
    ("-d", "--d", "mongoHostDtrData",
     "Host to dump data", "mongo_host_dtr_data"),
    ("-c", "--c", "cassandraHost",
     "Cassandra host", "cassandra_host"),
)

for _short, _long, _dest, _help, _metavar in _HOST_OPTIONS:
    parser.add_option(_short, _long, dest=_dest,
                      default="localhost",
                      type="string", help=_help,
                      metavar=_metavar)

# Parses sys.argv[1:]; positional leftovers land in `args`.
(options, args) = parser.parse_args()
30
 
31
# Hosts selected on the command line.
dtr_host, dtr_data_host = options.mongoHostDtr, options.mongoHostDtrData
db_hostname, cassandra_host = options.hostname, options.cassandraHost

# Single Cassandra session, bound to the "profitmandi" keyspace, shared by
# the whole script.
cluster = Cluster([cassandra_host])
session_cassandra = cluster.connect()
session_cassandra.set_keyspace("profitmandi")

# Echo the Mongo (Catalog/Dtr) host and the DB host being used.
print(dtr_host)
print(db_hostname)

# Accumulator filled by createViewsMap/createSalesMap and written out by
# commit: skuBundleId -> Analytics.
bundleMap = {}
45
 
46
class Analytics:
    """Per-bundle counters for one reporting day.

    Instances are stored in ``bundleMap`` and their ``__dict__`` is what
    ``commit`` writes out, so the attribute names double as the stored
    field names.
    """

    def __init__(self, skuBundleId, sales, views, date):
        # Identity of the row: which bundle, and which day it describes.
        self.skuBundleId, self.date = skuBundleId, date
        # Running totals, incremented in place by the aggregation functions.
        self.sales, self.views = sales, views
52
 
53
def createViewsMap():
    """Count the previous day's 'click' events per SKU bundle.

    Reads every ``events`` row with ``label='click'`` from Cassandra for the
    window [previous midnight, today's midnight), resolves each event's
    ``properties['sku']`` to a ``skuBundleId`` through
    ``Catalog.MasterData`` (matched on ``_id``), and increments ``views`` on
    the matching ``Analytics`` entry in the module-level ``bundleMap``,
    creating the entry (sales=0, views=1) on first sight.

    Events that cannot be attributed to a bundle are skipped rather than
    aborting the whole run: a missing or non-numeric ``sku`` property, an
    unknown SKU, or a master record without ``skuBundleId``.

    Returns nothing; the result is the mutation of ``bundleMap``.
    """
    # date_field is today's midnight (local clock); start is the previous
    # day's midnight. Both bounds are in the "java date" form produced by
    # to_java_date.
    date_field = datetime.combine(datetime.now().date(), time.min)
    start = to_java_date(date_field - timedelta(days=1))
    end = to_java_date(date_field)

    # Data stored in cassandra is in utc format, so the bounds are shifted
    # before being embedded in the query.
    # NOTE(review): this assumes to_java_date yields epoch milliseconds --
    # confirm against dtr.utils.utils.
    utc_start = to_java_date(datetime.utcfromtimestamp((start)/1000))
    utc_end = to_java_date(datetime.utcfromtimestamp((end)/1000))

    # Both bounds are computed above (never user input), so plain string
    # assembly is acceptable here.
    query = ("select * from events where label='click' and time >='"
             + str(utc_start) + "' and time < '" + str(utc_end)
             + "' ALLOW FILTERING")
    print(query)
    result = session_cassandra.execute(query)

    # Resolve the collection handle once instead of once per event.
    master_data = get_mongo_connection(host=dtr_host).Catalog.MasterData

    for event in result:
        properties = event.properties or {}
        try:
            sku = int(properties['sku'])
        except (KeyError, TypeError, ValueError):
            # Click without a usable sku: nothing to attribute it to.
            continue

        master = master_data.find_one({'_id': sku})
        if master is None:
            continue
        bundleId = master.get('skuBundleId')
        if bundleId is None:
            continue

        obj = bundleMap.get(bundleId)
        if obj is None:
            # The row is stamped with the start of the reporting window.
            bundleMap[bundleId] = Analytics(bundleId, 0, 1, start)
        else:
            obj.views = obj.views + 1
78
 
79
def createSalesMap():
    """Add the previous day's sold quantities per SKU bundle to ``bundleMap``.

    Two sources are combined over the window
    [previous midnight, today's midnight):

    * ``Dtr.merchantOrder`` documents in Mongo, selected on
      ``createdOnInt``. Each sub-order's ``productCode`` is resolved to a
      ``skuBundleId`` through ``Catalog.MasterData``; for store 3 it is
      matched on ``secondaryIdentifier``, otherwise on ``identifier``.
    * ``FlipkartOrders`` rows, selected on ``created``. Their ``catalogId``
      is used directly as the bundle id.

    For every resolved bundle the quantity is added to ``sales`` on its
    ``Analytics`` entry, creating the entry (views=0) when absent. Orders
    without sub-orders, sub-orders without a product code, unknown products
    and Flipkart rows without a catalog id are skipped.

    The SQL session opened by ``DataService.initialize`` is closed even if
    aggregation fails part-way.

    Returns nothing; the result is the mutation of ``bundleMap``.
    """
    DataService.initialize(db_hostname=db_hostname)
    date_field = datetime.combine(datetime.now().date(), time.min)
    start = to_java_date(date_field - timedelta(days=1))
    end = to_java_date(date_field)

    def add_sales(skuBundleId, qty):
        # Single place for the "increment or create" step shared by both
        # order sources.
        obj = bundleMap.get(skuBundleId)
        if obj is None:
            bundleMap[skuBundleId] = Analytics(skuBundleId, qty, 0, start)
        else:
            obj.sales = obj.sales + qty

    try:
        # Resolve the Mongo handles once instead of once per sub-order.
        mongo = get_mongo_connection(host=dtr_host)
        master_data = mongo.Catalog.MasterData

        # createdOnInt is compared against the bounds divided by 1000.
        all_orders = mongo.Dtr.merchantOrder.find(
            {'createdOnInt': {"$gte": start/1000, "$lt": end/1000}})
        for order in all_orders:
            store = order['storeId']
            # Store 3 products are keyed by their secondary identifier.
            if store != 3:
                id_field = 'identifier'
            else:
                id_field = 'secondaryIdentifier'
            for sub_order in order.get('subOrders') or ():
                if sub_order.get('productCode') is None:
                    continue
                productCode = str(sub_order['productCode'])
                qty = sub_order['quantity']
                master = master_data.find_one(
                    {id_field: productCode, 'source_id': store})
                if master is None:
                    continue
                add_sales(master.get('skuBundleId'), qty)

        # Lower bound is inclusive so the window is half-open like the Mongo
        # query above; with a strict ">" an order stamped exactly at
        # midnight would be missed by both this run and the previous one.
        fk_orders = session.query(FlipkartOrders) \
            .filter(FlipkartOrders.created >= to_py_date(start)) \
            .filter(FlipkartOrders.created < to_py_date(end)) \
            .all()
        for fk_order in fk_orders:
            if fk_order.catalogId is None:
                continue
            add_sales(fk_order.catalogId, fk_order.quantity)
    finally:
        session.close()
121
 
122
def commit():
    """Write every aggregated ``Analytics`` entry to Mongo.

    Each value in ``bundleMap`` is inserted, as its attribute dict, into the
    ``Analytics.ViewSalesData`` collection on the host given by the
    ``-d/--d`` command-line option (``dtr_data_host``). Previously that
    option was parsed but never used, so the helper's own default host was
    always written to.

    Returns nothing.
    """
    # NOTE(review): assumes get_mongo_connection_dtr_data accepts host= the
    # same way get_mongo_connection does -- confirm in dtr.utils.utils.
    # The collection handle is resolved once rather than once per row.
    collection = get_mongo_connection_dtr_data(
        host=dtr_data_host).Analytics.ViewSalesData
    for v in bundleMap.values():
        collection.insert(v.__dict__)
125
 
126
def main():
    """Run the daily job: count views, add sales, then store the result."""
    # Order matters: both aggregation steps fill bundleMap before commit
    # writes it out.
    for step in (createViewsMap, createSalesMap, commit):
        step()


if __name__ == "__main__":
    main()