Python操作Cassandra数据库

目录


前言

安装Cassandra

安装Cassandra数据库

  1. 官网下载Cassandra压缩包
  2. 解压,并配置环境变量:
    |操作|变量名|变量值|
    |:---:|:---|:---|
    |新建|CASSANDRA_HOME|解压路径|
    |增加|PATH|解压路径\bin;|

安装Python的Cassandra依赖包

pip install cassandra-driver

测试

C:\Users\wahaha>cassandra

Python操作Cassandra

新建keyspace和table

# -*- encoding: utf-8 -*-
# 引入Cluster模块
from cassandra.cluster import Cluster
# 引入DCAwareRoundRobinPolicy模块,可用来自定义驱动程序的行为
from cassandra.policies import DCAwareRoundRobinPolicy


# Connect to the default cluster on the local machine (127.0.0.1).
cluster = Cluster()
# Open a session on the cluster.
session = cluster.connect()
# Create the keyspace using SimpleStrategy with a replication factor of 3.
# The CQL map literal requires single quotes, so the Python string is
# delimited with double quotes (nesting single quotes is a syntax error).
session.execute(
    "CREATE KEYSPACE test WITH replication = "
    "{'class':'SimpleStrategy', 'replication_factor' : 3};"
)
# Select the keyspace for subsequent statements.
session.execute('use test;')
# Create the table; `name` is the primary key.
session.execute('create table test.user(name text primary key, age int, email varchar);')
# To drop the table again, run:
# session.execute('drop table test.user;')
# Close all connections held by the cluster.
cluster.shutdown()
# Show whether the cluster has been shut down.
print(cluster.is_shutdown)

查询keyspaces/tables/columns状态

# -*- encoding: utf-8 -*-
# 引入Cluster模块
from cassandra.cluster import Cluster
# 引入DCAwareRoundRobinPolicy模块,可用来自定义驱动程序的行为
from cassandra.policies import DCAwareRoundRobinPolicy


# Connect to the default cluster on the local machine (127.0.0.1).
cluster = Cluster()
# Open a session; the script then reads the schema metadata from the cluster.
session = cluster.connect()

separator = '----------'

# Walk the schema metadata from the outside in: keyspaces -> tables of
# `test` -> the `user` table -> its columns -> the `age` column.
# Each level is looked up only right before it is printed.
print(cluster.metadata.keyspaces)
print(separator)
test_tables = cluster.metadata.keyspaces['test'].tables
print(test_tables)
print(separator)
user_table = cluster.metadata.keyspaces['test'].tables['user']
print(user_table)
print(separator)
user_columns = cluster.metadata.keyspaces['test'].tables['user'].columns
print(user_columns)
print(separator)
age_column = cluster.metadata.keyspaces['test'].tables['user'].columns['age']
print(age_column)
print(separator)

# Close all connections held by the cluster.
cluster.shutdown()
# Show whether the cluster has been shut down.
print(cluster.is_shutdown)

插入和查询表中的数据

# -*- encoding: utf-8 -*-
# 引入Cluster模块
from cassandra.cluster import Cluster
# 引入DCAwareRoundRobinPolicy模块,可用来自定义驱动程序的行为
from cassandra.policies import DCAwareRoundRobinPolicy


# Connect to the default cluster on the local machine (127.0.0.1).
cluster = Cluster()
# Open a session on the cluster.
session = cluster.connect()

# Parameterized insert; the driver substitutes each %s from the value list.
insert_cql = 'insert into test.user (name, age, email) values (%s, %s, %s);'
# NOTE(review): '[email protected]' looks like a scraper's e-mail
# obfuscation placeholder rather than a real address - confirm the intended values.
new_users = (
    ['aaa', 21, '[email protected]'],
    ['bbb', 22, '[email protected]'],
    ['ddd', 20, '[email protected]'],
)
for user_values in new_users:
    session.execute(insert_cql, user_values)

# Read every row back from the table and print it.
for record in session.execute('select * from test.user;'):
    print(record)

# Close all connections held by the cluster.
cluster.shutdown()
# Show whether the cluster has been shut down.
print(cluster.is_shutdown)

连接远程数据库

# -*- encoding: utf-8 -*-
from cassandra import ConsistencyLevel
# 引入Cluster模块
from cassandra.cluster import Cluster
# 引入DCAwareRoundRobinPolicy模块,可用来自定义驱动程序的行为
# from cassandra.policies import DCAwareRoundRobinPolicy
from cassandra.auth import PlainTextAuthProvider
from cassandra.query import SimpleStatement
import pandas as pd


# IP addresses of the Cassandra cluster nodes; replace with your own remote hosts.
contact_points = ['1.1.1.1', '2.2.2.2', '3.3.3.3']
# Credentials for the Cassandra cluster; replace with your own account and password.
auth_provider = PlainTextAuthProvider(username='XXX', password='XXX')
# Build the cluster handle for the remote nodes.
cluster = Cluster(contact_points=contact_points, auth_provider=auth_provider)
# Open a session on the cluster.
session = cluster.connect()
# Define the CQL query, executed at consistency level ONE.
# NOTE(review): 'keyspace.table' looks like a placeholder - substitute real names.
cql_str = 'select * from keyspace.table limit 5;'
simple_statement = SimpleStatement(cql_str, consistency_level=ConsistencyLevel.ONE)
# Execute the statement with the timeout set to None.
execute_result = session.execute(simple_statement, timeout=None)
# Materialize the rows through public iteration instead of the private
# `_current_rows` attribute, which only holds the currently fetched page.
result = list(execute_result)
# Convert the rows into a DataFrame.
result = pd.DataFrame(result)
# Append the query result to a CSV file (a header row is written on every run).
result.to_csv('连接远程数据库.csv', mode='a', header=True)
# Close all connections held by the cluster.
cluster.shutdown()

猜你喜欢

转载自www.cnblogs.com/yun1233/p/10385693.html
今日推荐