import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
import json
from pandas import DataFrame, Series
# Column names for the three MovieLens tables; each file is read with
# header=None, so the names are supplied explicitly.
unames = ['user_id', 'gender', 'age', 'occupation', 'zip']
rnames = ['user_id', 'movie_id', 'rating', 'timestamp']
mnames = ['movie_id', 'title', 'genres']

# Load the '::'-delimited tables.
# A multi-character separator is not supported by pandas' C parser: pandas
# treats it as a regular expression and falls back to the Python engine with
# a ParserWarning. Requesting engine='python' explicitly yields the same
# frames without the warning.
# NOTE(review): if reading movies.dat raises UnicodeDecodeError, the file is
# probably not UTF-8 -- confirm the dataset's encoding and pass `encoding=`.
users = pd.read_table('ch02/movielens/users.dat', sep='::', header=None,
                      names=unames, engine='python')
ratings = pd.read_table('ch02/movielens/ratings.dat', sep='::', header=None,
                        names=rnames, engine='python')
movies = pd.read_table('ch02/movielens/movies.dat', sep='::', header=None,
                       names=mnames, engine='python')

# Merge: ratings joined to users on 'user_id', then to movies on 'movie_id'.
# These are the only columns the tables share, so naming them explicitly
# matches what the implicit merge would pick while documenting the join keys.
ratings_with_users = pd.merge(ratings, users, on='user_id')
data = pd.merge(ratings_with_users, movies, on='movie_id')

# Pivot table: mean rating per movie title, one column per gender value.
mean_ratings = data.pivot_table(values='rating', index='title',
                                columns='gender', aggfunc='mean')
ratings_by_title = da
# Python pandas in practice: processing movie ratings
# (Latest recommended article published on 2025-03-24 21:34:03)
