Simple data visualization of 51job job-listing data

Disclaimer: This is an original article by the blogger, released under the CC 4.0 BY-SA license. If you reproduce it, please include a link to the original source and this statement.
Link to this article: https://blog.csdn.net/lipachong/article/details/101155620

The crawler (web-scraper) code that produced the data is in this blog post: https://blog.csdn.net/lipachong/article/details/101155790

# Import the modules used below
import pandas as pd  #数据框操作
import matplotlib.pyplot as plt #绘图
import matplotlib as mpl #配置字体


# Use the SimHei font for sans-serif text so that the Chinese category names
# used as axis labels can be rendered (the default font lacks those glyphs).
mpl.rcParams['font.sans-serif'] = ['SimHei']
# Global plot style: label/tick/legend font sizes and the default figure size.
plt.rcParams.update({
    'axes.labelsize': 8.0,
    'xtick.labelsize': 12.0,
    'ytick.labelsize': 12.0,
    'legend.fontsize': 10.0,
    'figure.figsize': [8.0, 8.0],
})

# Load the job listings from the CSV file in the current working directory.
data3 = pd.read_csv('51job.csv')

# Take a few exploratory slices of the table.
head = data3.head()        # leading rows
row1 = data3.iloc[:, 0]    # first column; use index 1 for the second column, and so on
cow1 = data3.loc[0]        # the row labelled 0
wei = data3.tail()         # trailing rows; pass a number to choose how many
xuewei = data3['xuewei']   # the education-level column
# Distinct education levels and how often each one occurs.
xuewei_count = data3['xuewei'].value_counts()

# Print every slice, in the order listed above.
for preview in (head, row1, cow1, wei, xuewei, xuewei_count):
    print(preview)
# The 'xuewei' (education) column contains malformed entries such as
# "hiring N people" text; every value containing the character '人' is
# replaced with the placeholder '信息缺失'.
xuewei = data3['xuewei']
# Only strings are tested for the marker: empty CSV cells are loaded by pandas
# as float NaN, and `'人' in nan` would raise TypeError. Non-string values are
# passed through unchanged.
xueli = [
    '信息缺失' if isinstance(x, str) and '人' in x else x
    for x in xuewei
]
data3['xuewei'] = xueli

# The 'address' column mixes city-level and district-level values (for example
# '上海-浦东新区' and '上海'), which produces too many categories. Keep only the
# part before the first '-' and remove the '\xa0\xa0' padding.
address = data3['address']
# `split('-')[0]` returns the whole string when there is no '-', so one
# expression covers both cases and the padding is stripped uniformly.
# Non-string values (e.g. NaN from empty CSV cells) are passed through
# unchanged instead of raising TypeError on the `in` test.
quyu = [
    x.split('-')[0].replace('\xa0\xa0', '') if isinstance(x, str) else x
    for x in address
]
data3['address'] = quyu


# Recount the education levels on the current contents of the column.
xuewei_count = data3['xuewei'].value_counts()
print(xuewei_count)


# Education levels as a vertical bar chart.
xuewei_count.plot.bar()
plt.show()   # display the figure

# Education levels again, as a horizontal bar chart.
xuewei_count.plot.barh()
plt.show()   # display the figure

# Work experience ('jingyan') as a horizontal bar chart.
experience_counts = data3['jingyan'].value_counts()
experience_counts.plot.barh()
plt.show()   # display the figure

# Share of listings per region as a pie chart, labelled with percentages
# to two decimal places.
region_counts = data3['address'].value_counts()
region_counts.plot.pie(autopct='%1.2f%%')
plt.show()   # display the figure

You may also like

Source: blog.csdn.net/lipachong/article/details/101155620