def export_data_table(self, table, end_date, label, feature_names):
    """Save a data set as an HDF table for later reuse.

    The file is written to ``<self.results_directory>/<file_name>.h5``,
    where ``file_name`` is whatever ``self.export_metadata`` returns, and
    is then passed to ``self.upload_file_to_s3``. If a file already exists
    at that path it is not rewritten.

    :param table: the DataFrame to save
    :type table: pandas DataFrame
    :param end_date: end of labeling period
    :type end_date: numpy.datetime64, or an object exposing
        ``to_pydatetime()`` (e.g. a pandas Timestamp) or the legacy
        ``to_datetime()``
    :param label: name of the column containing labels
    :type label: str
    :param feature_names: names of the columns containing features
    :type feature_names: list
    :return: the prefix of the HDF filename
    :rtype: str
    """
    if isinstance(end_date, np.datetime64):
        # Keep only the leading YYYY-MM-DD part of the ISO string.
        end_date = np.datetime_as_string(end_date, timezone='local')[:10]
    else:
        # Timestamp.to_datetime() is gone from current pandas; prefer
        # to_pydatetime() and fall back to the old name for legacy objects.
        as_datetime = getattr(end_date, 'to_pydatetime', None)
        if as_datetime is None:
            as_datetime = end_date.to_datetime
        end_date = as_datetime().date().isoformat()

    file_name = self.export_metadata(end_date, label, feature_names)
    file_path = '{0}/{1}.h5'.format(self.results_directory, file_name)

    if not os.path.exists(file_path):
        # The context manager closes the store even if the write fails.
        with pd.HDFStore(file_path) as store:
            store['df'] = table

    # NOTE(review): the upload is assumed to run whether or not the local
    # file was freshly written — confirm against the intended behaviour.
    self.upload_file_to_s3('{0}.h5'.format(file_name), 'hdf_bucket_name',
                           file_path)
    print("uploaded hdf to s3")

    return file_name
feature_model_grabber.py 文件源码
python
阅读 28
收藏 0
点赞 0
评论 0
评论列表
文章目录