import pymongo
class test1():
    """Store records in a MongoDB collection, keyed by their ``paqu_url`` field.

    The connection settings, the client and the collection handle are class
    attributes: they are created once, when the class body is executed, and
    are shared by every caller.
    """

    mongo_host = "192.168.31.26"  # IP address of the MongoDB server
    mongo_port = 27017
    mongo_db = "sa12"  # database name
    mongo_coll = "rpm"  # collection name
    mongo_user = "admin"  # account
    mongo_pwd = "pFdada"  # password
    # NOTE(review): credentials are hard-coded in source; consider loading
    # them from configuration or the environment instead.
    client = pymongo.MongoClient(host=mongo_host, port=mongo_port)
    # Authentication is not enabled here, so mongo_user / mongo_pwd are
    # currently unused. (The legacy ``client.admin.authenticate(...)`` call
    # that used them no longer exists in PyMongo 4.)
    db = client[mongo_db]  # handle to the database
    coll = db[mongo_coll]  # handle to the collection

    def a(self, rs_obj):
        """Insert ``rs_obj``, or update the stored record with the same ``paqu_url``.

        Args:
            rs_obj: Mapping of field names to values to store. It must contain
                the key ``'paqu_url'``, which is used as the match condition.

        Raises:
            KeyError: If ``rs_obj`` is a dict without a ``'paqu_url'`` key.
        """
        # update_one(..., upsert=True) is the replacement for the legacy
        # Collection.update(..., upsert=True, multi=False): it modifies at
        # most one matching document and inserts one when nothing matches,
        # so the same paqu_url is never stored twice.
        self.coll.update_one(
            {'paqu_url': rs_obj['paqu_url']},
            {'$set': rs_obj},
            upsert=True,
        )
# Example: store one record. 'paqu_url' is the field whose value must not repeat.
rs_obj = {'paqu_url': '123'}  # data to be stored
# Call the method on an instance instead of passing the class object as ``self``.
test1().a(rs_obj)
这里我采用的是带 upsert=True 的 update 操作:以 paqu_url 作为匹配条件,记录已存在时更新,不存在时才插入,因此可以保证不会重复插入。(我是将 Scrapy 爬取的数据存储在 MongoDB 中。)
1. 安装依赖组件:pip install pymongo
2.代码
3.运行查看结果