def get_basic_user_fea():
    """Build and persist the one-hot encoded basic user feature table.

    Reads the user CSV located at ``FilePath + UserFile`` (GBK encoded),
    maps five age-bracket labels to the integer codes 1-5, keeps only the
    rows whose age is one of 1, 2, 3, 4, 5 or -1, and one-hot encodes the
    ``age``, ``sex`` and ``user_lv_cd`` columns.

    The resulting frame (``user_id`` followed by the dummy columns) is
    written to ``FilePath + 'user_basic_fea.csv'`` without the index and
    is also returned to the caller.
    """
    frame = pd.read_csv(FilePath + UserFile, encoding='gbk')

    # NOTE(review): the '?' characters in these labels look like encoding
    # loss of non-ASCII suffixes -- confirm against the raw user file.
    age_labels = [u'16-25?', u'26-35?', u'36-45?', u'46-55?', u'56???']
    age_codes = [1, 2, 3, 4, 5]
    frame['age'] = frame['age'].replace(age_labels, age_codes)

    # Keep only rows whose age is a recognised code; everything else
    # (unmapped labels, missing values) is dropped.
    kept_codes = (1, 2, 3, 4, 5, -1)
    keep_mask = frame['age'] == kept_codes[0]
    for code in kept_codes[1:]:
        keep_mask = keep_mask | (frame['age'] == code)
    frame = frame[keep_mask]

    # One dummy block per categorical column, prefixed with the column name.
    dummy_blocks = [
        pd.get_dummies(frame[column], prefix=column)
        for column in ("age", "sex", "user_lv_cd")
    ]
    features = pd.concat([frame['user_id']] + dummy_blocks, axis=1)

    features.to_csv(FilePath + 'user_basic_fea.csv', index=False)
    return features
#???????????????
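# 评论列表 (comment list) -- web-page navigation residue, not part of the program
# 文章目录 (table of contents) -- web-page navigation residue, not part of the program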