Subversion Repositories SmartDukaan

Rev

Rev 17790 | Rev 17792 | Go to most recent revision | Details | Compare with Previous | Last modification | View Log | RSS feed

Rev Author Line No. Line
13828 kshitij.so 1
import pysolr
14186 kshitij.so 2
import pymongo
13828 kshitij.so 3
import json
14186 kshitij.so 4
import os
14243 kshitij.so 5
import optparse
14245 kshitij.so 6
import shutil
13828 kshitij.so 7
 
8
con=None
9
 
14186 kshitij.so 10
filePath = '/tmp/autosuggest.json'
11
destFilePath = '/home/kshitij/'
12
 
13828 kshitij.so 13
categoryMap = {3:'Mobiles',5:'Tablets'}
17790 kshitij.so 14
SOURCE_MAP = {1:'AMAZON',2:'FLIPKART',3:'SNAPDEAL',4:'SAHOLIC',5:"SHOPCLUES.COM",6:"PAYTM.COM",7:"HOMESHOP18.COM"}
13828 kshitij.so 15
xstr = lambda s: s or ""
16
 
14243 kshitij.so 17
parser = optparse.OptionParser()
18
parser.add_option("-m", "--m", dest="mongoHost",
19
                      default="localhost",
20
                      type="string", help="The HOST where the mongo server is running",
21
                      metavar="HOST")
14248 kshitij.so 22
parser.add_option("-s", "--s", dest="server",
23
                      default="localhost",
24
                      type="string", help="The HOST where the mongo server is running",
25
                      metavar="HOST")
14243 kshitij.so 26
 
27
(options, args) = parser.parse_args()
28
 
15067 kshitij.so 29
synonymsMap = {}
30
modelNameSynonymMap = {}
14243 kshitij.so 31
 
15067 kshitij.so 32
 
13828 kshitij.so 33
class __SkuInfo:
34
 
13931 kshitij.so 35
    def __init__(self, id, skuBundleId, brand, model_name, source_product_name, category_id, category, available_price, mrp, in_stock, \
15067 kshitij.so 36
                 source_id, store, title, thumbnail, priceUpdatedOn, brand_synonyms, model_name_synonyms):
13828 kshitij.so 37
        self.id = id
38
        self.skuBundleId = skuBundleId
39
        self.brand = brand
40
        self.model_name = model_name
13931 kshitij.so 41
        self.source_product_name = source_product_name
13828 kshitij.so 42
        self.category_id = category_id
43
        self.category = category
44
        self.available_price = available_price
45
        self.mrp = mrp
46
        self.in_stock = in_stock
47
        self.source_id = source_id
48
        self.store = store
49
        self.title= title
50
        self.thumbnail = thumbnail
13985 kshitij.so 51
        self.priceUpdatedOn = priceUpdatedOn
15067 kshitij.so 52
        self.brand_synonyms = brand_synonyms
53
        self.model_name_synonyms = model_name_synonyms
13828 kshitij.so 54
 
55
 
56
solr = pysolr.Solr("http://104.200.25.40:8080/solr/", timeout=10)
57
 
58
def pushData():
15067 kshitij.so 59
    populateBrandSynonymMap()
15068 kshitij.so 60
    populateModelNameSynonyms()
13828 kshitij.so 61
    l = []
17790 kshitij.so 62
    exception = []
14186 kshitij.so 63
    catalogMap = {}
17791 kshitij.so 64
    items = get_mongo_connection(options.mongoHost).Catalog.MasterData.find({'source_id' : { "$in": SOURCE_MAP.keys() } })
13828 kshitij.so 65
    print items.count()
66
    for item in items:
17790 kshitij.so 67
        try:
68
            title = xstr(item['brand'])+" "+xstr(item['model_name'])
69
        except:
70
            exception.append(item['_id'])
71
            continue
14186 kshitij.so 72
        if not catalogMap.has_key(str(item['skuBundleId'])+" "+title):
14204 kshitij.so 73
            catalogMap[str(item['skuBundleId'])+" "+title] = [title]
13974 kshitij.so 74
        s_info = __SkuInfo(str(item['_id']),int(item['skuBundleId']),(item['brand']),(item['model_name']),(item['source_product_name']),int(item['category_id']),categoryMap.get(item['category_id']),float(item['available_price']),float(item['mrp']),item['in_stock'], \
15067 kshitij.so 75
                        int(item['source_id']),(item['source']),title,(item['thumbnail']), long(item['priceUpdatedOn']), synonymsMap.get(item['brand'].upper()), modelNameSynonymMap.get(item['skuBundleId']))
13828 kshitij.so 76
        l.append(s_info.__dict__)
16297 kshitij.so 77
    solr.add(l,boost={'source_product_name': '2.0',})
14186 kshitij.so 78
 
17790 kshitij.so 79
 
80
    for x in exception:
81
        print x
82
 
14204 kshitij.so 83
    autoSuggestList = []
84
    for v in catalogMap.itervalues():
14214 kshitij.so 85
        autoSuggestList.append({'val':v[0]})
14186 kshitij.so 86
    PATH = os.path.expanduser(filePath)
87
    if os.path.isfile(PATH):
88
        try:
89
            os.remove(os.path.expanduser(filePath))
90
        except OSError:
91
            pass
92
    output = open(filePath, 'ab+')
14204 kshitij.so 93
    json.dump(autoSuggestList, output)
14186 kshitij.so 94
    output.close()
14248 kshitij.so 95
    if options.server !='localhost':
14244 kshitij.so 96
        try:
14248 kshitij.so 97
            os.system("scp "+filePath +" root@"+options.server+":"+destFilePath)
14244 kshitij.so 98
        except:
14245 kshitij.so 99
            shutil.copy2(filePath, destFilePath)
14186 kshitij.so 100
 
101
 
13828 kshitij.so 102
 
15067 kshitij.so 103
def populateBrandSynonymMap(): 
104
    global synonymsMap
105
    brand_synonyms = get_mongo_connection(options.mongoHost).Catalog.BrandSynonyms.find()
106
    for synonym in brand_synonyms:
107
        synonymsMap[synonym['brand'].upper()] = synonym['synonyms']
108
 
109
def populateModelNameSynonyms():
110
    global modelNameSynonymMap
111
    model_synonyms = get_mongo_connection(options.mongoHost).Catalog.ModelNameSynonyms.find()
112
    for synonym in model_synonyms:
113
        modelNameSynonymMap[synonym['skuBundleId']] = synonym['synonyms'] 
114
 
13828 kshitij.so 115
def get_mongo_connection(host='localhost', port=27017):
116
    global con
117
    if con is None:
118
        print "Establishing connection %s host and port %d" %(host,port)
119
        try:
120
            con = pymongo.MongoClient(host, port)
121
        except Exception, e:
122
            print e
123
            return None
124
    return con
14186 kshitij.so 125
 
13828 kshitij.so 126
if __name__=='__main__':
17790 kshitij.so 127
    pushData()