1、搜集数据集
https://grouplens.org/datasets/movielens/
2、准备数据
import pandas as pd
import numpy as np
import tensorflow as tf
# Load the user ratings table.
# NOTE(review): this is an absolute, machine-specific path while movies.csv
# below is read relative to the working directory -- confirm which is intended.
ratings_df = pd.read_csv(
    filepath_or_buffer='C:/Users/Administrator/PycharmProjects/myproject/ml-latest-small/ratings.csv',
)

# Load the movies table, record each movie's row position in a new
# 'movieRow' column, and keep only the three columns selected here.
movies_df = pd.read_csv(filepath_or_buffer='ml-latest-small/movies.csv')
movies_df = movies_df.assign(movieRow=movies_df.index)[
    ['movieRow', 'movieId', 'title']
]

# Write the trimmed movies table to disk (header row kept, index omitted).
movies_df.to_csv(
    path_or_buf='moviesProcessed.csv',
    index=False,
    header=True,
    encoding='utf-8',
)
#将rating_df中的movieId替换为行号
ratings_df = pd.merge(ratings_df, movies_df, on=