K-Nearest Neighbors近邻算法(KNN)(简单版)

通过KNN算法计算唐人街探案是哪个类型的电影

import pandas as pd
import numpy as np


def fun(x, y, z, company, n):
    # 得到各行的相似度(欧式距离)
    dis = ((company.iloc[:, 0] - x) ** 2 + (company.iloc[:, 1] - y) ** 2 + (company.iloc[:, 2] - z) ** 2) ** 0.5
    # np.argsort()返回的是排序完的下标,然后返回前面n个对应的行的下标
    dis_index = np.argsort(dis)[:n]
    # 取出返回下标的电影类型
    type = company.iloc[dis_index, 3]
    # print(type)
    # 取出众数
    new_type = type.mode()
    # print(new_type)
    return new_type


# 读取文件获得数组
company = pd.read_excel(r"C:\Users\Administrator\Desktop\电影分类数据.xlsx", encoding="gbk")
# 除去名字叫电影名称和序号的两列
company.drop(labels=['电影名称', '序号'], axis=1, inplace=True)

print(fun(23, 3, 17, company, 5))

猜你喜欢

转载自blog.csdn.net/runs_after_the_wind/article/details/82889866