# coding=utf-8
'''
Created on 2016-03-30

Temporary one-off script for obtaining the new "kind" entries.

It loads the documents currently stored in ``spider.kind_temp``, hands them
to ``DetailAnalysisKind``, feeds every ``kindls`` value found in
``spider.kind_from_listpage`` through ``_add_into_out_list`` and finally
writes the resulting ``out_list`` to ``spider.kind_temp_1``.

@author: ChenHao
'''
from util_common import Constant
from pymongo.mongo_client import MongoClient
import time
from analysis import detailAnalysis_kind

TimeStart = time.time()

# Step 1: fetch the kinds that exist right now.
# NOTE: an earlier variant obtained this list through
# loadData_from_db.LoadDataFromDB()._get_kindlist_from_db(db) instead of
# querying kind_temp directly.
cli = MongoClient(Constant.MONGODB_URL)
try:
    db = cli.spider
    kindlist = list(db.kind_temp.find())
    print (kindlist)
    print (len(kindlist))
finally:
    # Release the connection even if the query or the printing fails.
    cli.close()

detail_analysis_kind = detailAnalysis_kind.DetailAnalysisKind(kindlist)

# Step 2: run every "kindls" value from the list pages through the analyser
# and persist whatever it collected in out_list.
cli = MongoClient(Constant.MONGODB_URL)
try:
    db = cli.spider
    rs = db.kind_from_listpage.find({}, {"kindls": True})
    for r in rs:
        detail_analysis_kind._add_into_out_list(r["kindls"])
    # insert_many() rejects an empty document list, so skip the write when
    # the analysis produced nothing (assumes out_list is a plain list --
    # TODO confirm against DetailAnalysisKind).
    if detail_analysis_kind.out_list:
        db.kind_temp_1.insert_many(detail_analysis_kind.out_list)
    print (detail_analysis_kind.out_list)
    print (len(detail_analysis_kind.out_list))
finally:
    cli.close()

TimeEnd = time.time()
# The label below is runtime output ("elapsed time") and is kept verbatim.
print ("耗时", TimeEnd - TimeStart)