Using Python to operate HDFS

Operating HDFS from Python requires the `hdfs` library, which can be installed as follows:

pip install --user hdfs

The Python code for operating on Hadoop (HDFS) is as follows:

# -*- coding: utf-8 -*-

# @Time    : 2020/3/7 18:43
# @Author  : focksor
# @Email   : [email protected]
import os

from hdfs import Client


if __name__ == '__main__':
    # Demo script: walks through the basic WebHDFS file operations
    # (mkdir, upload, rename, download, delete) against a single NameNode,
    # printing a directory listing after each step.
    hdfs_ip = "192.168.232.150"
    hdfs_version = 3
    hdfs_root = "/test"
    filepath = r"C:\Users\focks\OneDrive\DevEm\VMware\iso\ubuntu-18.04.1-desktop-amd64.iso"

    # Default NameNode HTTP port: 9870 on Hadoop 3.x, 50070 on Hadoop 2.x.
    # (The previous fallback, 90070, is above the maximum TCP port 65535.)
    webhdfs_port = 9870 if hdfs_version == 3 else 50070
    hdfs_addr = "http://{}:{}".format(hdfs_ip, webhdfs_port)

    # Remote paths used below. The rename step expects the upload to have
    # kept the local file name inside hdfs_root.
    uploaded_path = hdfs_root + "/ubuntu-18.04.1-desktop-amd64.iso"
    renamed_path = hdfs_root + "/ubuntu.iso"

    client = Client(hdfs_addr)

    # Create the working directory.
    print("创建文件夹")
    client.makedirs(hdfs_root)
    print(client.list("/"))

    # Upload the local file into the working directory.
    print("上传文件")
    client.upload(hdfs_root, filepath)
    print(client.list(hdfs_root))

    # Rename the uploaded file.
    print("修改文件名")
    client.rename(uploaded_path, renamed_path)
    print(client.list(hdfs_root))

    # Download the renamed file into the current local directory.
    print("下载文件")
    client.download(renamed_path, ".")
    print(os.listdir("."))

    # Delete the remote file.
    print("删除文件")
    client.delete(renamed_path)
    print(client.list(hdfs_root))

Guess you like

Origin www.cnblogs.com/focksor/p/hdfs_operation_with_python.html