def process(file_in=PATH_FILE_IN, file_out=PATH_FILE_FINAL):
    """Build sliding-window samples and next-value targets, then save them.

    The ``close`` column of the object unpickled from ``file_in`` is min-max
    scaled, folded into rows of 24 values, and reduced to the first value of
    every row.  Each run of 5 consecutive values in that reduced series
    becomes one sample; the value immediately after the run is its target.

    Args:
        file_in: Path passed to ``pd.read_pickle``.  The loaded object must
            provide a ``close`` column whose length is a multiple of 24,
            otherwise the reshape raises ``ValueError``.
        file_out: Indexable pair of ``np.save`` destinations.  Item 0
            receives the samples (shape ``(n, 5)``), item 1 the targets
            (shape ``(n,)``).

    Returns:
        None.  The results are only written to disk.
    """
    window = 5

    closes = pd.read_pickle(file_in)['close']
    scaled = preprocessing.minmax_scale(closes)

    # Keep only the first entry of each 24-value row.
    # NOTE(review): presumably 24 hourly points per day -- confirm upstream.
    leading = scaled.reshape(-1, 24)[:, 0]
    row_count = len(leading)

    samples = np.array([
        leading[start:start + window]
        for start in range(row_count - window + 1)
    ])
    # Forces a 2-D (n, 5) layout even when no full window exists.
    samples = samples.reshape(-1, window)

    targets = np.array([
        leading[start + window]
        for start in range(row_count - window)
    ])

    # The final window has no following value to predict, so it is dropped
    # to keep samples and targets the same length.
    np.save(file_out[0], samples[:-1])
    np.save(file_out[1], targets)
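# Comment list  (appears to be page-navigation text, not part of the program)
# Table of contents  (appears to be page-navigation text, not part of the program)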