Blame | Last modification | View Log | RSS feed
"""Driver script runindiaplaza.py: crawl indiaplaza until the datastore says stop.

This is the script called by consetup.py.  It runs the "indiaplaza" spider
repeatedly, so the number of crawl passes is decided at run time (the
original notes describe this as determining the number of pages
dynamically).  Before every pass the pass counter is written to the
datastore under 'indiaplaza_count'; crawling stops as soon as the datastore
value 'indiaplaza_flag' is no longer 'TRUE'.

NOTE(review): the original notes also say a CSV file is generated
afterwards; that step is not part of the code visible here.

Usage:
    python runindiaplaza.py <projects_folder>

    <projects_folder> is the folder in which the spider projects reside and
    must START with os.pathsep, e.g. ":/home/gaurav/code".  The leading
    separator is what keeps the PYTHONPATH entries built below apart.
"""
import os
import subprocess
import sys

from datastore.DataAccessor import DataHelper

ps = os.pathsep
ds = os.sep

# Fail with a readable message instead of a bare IndexError traceback.
if len(sys.argv) < 2:
    sys.exit("usage: %s <projects_folder prefixed with os.pathsep>" % sys.argv[0])

path = sys.argv[1]


def _src_dir(root, project):
    """Return '<root><sep><project><sep>src' using the platform separator."""
    return ds.join((root, project, "src"))


# Source folder of the spider project; like `path`, it still carries the
# leading os.pathsep at this point.
spider_src = _src_dir(path, "indiaplazaScrapypass1")

# Every entry except the first keeps the leading os.pathsep inherited from
# `path`, so plain concatenation yields a well-formed search path.  The first
# entry has that separator stripped so the value does not begin with one.
python_path = "".join([
    _src_dir(path[1:], "ScrapyDatastore"),
    _src_dir(path, "ExtraFunctions"),
    _src_dir(path, "filterforname"),
    spider_src,
])

# Assigning through os.environ updates both the mapping and the real process
# environment (os.putenv alone would leave os.environ stale).  Any PYTHONPATH
# inherited from the caller is replaced, exactly as before.
os.environ["PYTHONPATH"] = python_path

# Drop the path separator(s) to get a usable filesystem path to the
# project's scrapy control script.
scrapy_ctl = spider_src.replace(ps, "") + ds + "scrapy-ctl.py"

da = DataHelper()
da.initxy()

# Initial counter value, kept from the original script.
# NOTE(review): the meaning of 18 is not documented here -- confirm.
ct = 18
da.set_extra_vars('indiaplaza_count', str(ct), '')
da.set_extra_vars('indiaplaza_fails', '0', '')
da.set_extra_vars('indiaplaza_flag', 'TRUE', '')
flag = da.get_extra_vars('indiaplaza_flag')

# One spider run per iteration.  This script never clears the flag itself;
# presumably the spider run does so through the datastore -- verify against
# the spider code.
while flag == 'TRUE':
    subprocess.call(["python", scrapy_ctl, "crawl", "indiaplaza"])
    ct += 1
    da.set_extra_vars('indiaplaza_count', str(ct), '')
    flag = da.get_extra_vars('indiaplaza_flag')