def add_all_columns(group):
    """Add event-order and timing columns to one group of timestamped rows.

    The rows are sorted ascending by the module-level ``timestamp_col``
    column, and these columns are added to the sorted frame:

    * ``event_nr`` -- 1-based position of the row within the sorted group.
    * ``last`` -- the string ``"true"`` on the final row, ``"false"`` elsewhere.
    * ``elapsed`` -- seconds between the first row's timestamp and this row's.
    * ``remtime`` -- seconds between this row's timestamp and the last row's.
    * ``duration`` -- seconds since the previous row's timestamp.
    * ``weekday`` / ``hour`` -- ``.dt.weekday`` / ``.dt.hour`` of the timestamp.

    Any time difference that cannot be computed (NaT, which always includes
    the ``duration`` of the first row) is reported as ``0.0`` seconds.

    Args:
        group: DataFrame holding the ``timestamp_col`` column; that column
            must have a datetime dtype because the ``.dt`` accessor is used.

    Returns:
        The sorted DataFrame with the columns above added. ``sort_values``
        produces a new frame, so the columns are not added to the argument.

    Raises:
        IndexError: If ``group`` has no rows (there is no first/last
            timestamp to measure from).
    """

    def to_seconds(deltas):
        # Convert to float seconds first and fill the gaps afterwards, so the
        # fill value always matches the column dtype (filling a timedelta
        # column with the integer 0 is not portable across pandas versions).
        return deltas.dt.total_seconds().fillna(0.0)

    group = group.sort_values(timestamp_col, ascending=True)
    timestamps = group[timestamp_col]
    n_events = len(group)

    group["event_nr"] = range(1, n_events + 1)

    # Build the flag column in one assignment instead of the chained
    # ``group["last"].iloc[-1] = ...``, which may write to a temporary copy.
    last_flags = ["false"] * n_events
    if last_flags:
        last_flags[-1] = "true"
    group["last"] = last_flags

    first_ts = timestamps.iloc[0]
    last_ts = timestamps.iloc[-1]

    group["elapsed"] = to_seconds(timestamps - first_ts)
    group["remtime"] = to_seconds(last_ts - timestamps)
    # shift(1) leaves the first row without a predecessor -> NaT -> 0.0.
    group["duration"] = to_seconds(timestamps - timestamps.shift(1))

    group["weekday"] = timestamps.dt.weekday
    group["hour"] = timestamps.dt.hour
    return group
preprocess_PurchOrders.py 文件源码
python
阅读 29
收藏 0
点赞 0
评论 0
评论列表
文章目录