def split(self, *splits):
    """Randomly partition the data into consecutive, non-overlapping groups.

    The row indices ``0 .. len(self.x) - 1`` are shuffled with
    ``random.shuffle``.  The weights in ``splits`` (with a leading 0
    prepended) are then turned into integer positions in that shuffled
    order, scaled by ``len(self.x) / sum(splits)``, and each pair of
    positions delimits the rows of one group.

    Args:
        *splits: Relative weights of the requested groups, e.g.
            ``split(8, 1, 1)``.
            NOTE(review): assumed to be non-negative numbers -- confirm
            against callers.

    Returns:
        The list produced by the query pipeline: one ``Data`` object per
        (start, end) pair, constructed with one keyword argument per entry
        of ``self.sources`` whose value is ``source[rows, :]`` for the rows
        of that group.

    Note:
        A weight total of zero (including calling with no weights) makes
        the boundary computation divide by zero.
        NOTE(review): ``.scan()`` presumably yields running totals and
        ``_window(n=2)`` presumably yields consecutive pairs; both are
        defined outside this block -- confirm.
    """
    data_length = len(self.x)
    # Materialise the indices: random.shuffle needs a mutable sequence, and
    # range() is only a list on Python 2.
    indexes = list(range(data_length))
    random.shuffle(indexes)

    boundaries = [0] + list(splits)
    splits_total = sum(boundaries)

    def _rows(bounds):
        # Explicit unpacking replaces the tuple-parameter lambda, which is a
        # syntax error on Python 3.
        start, end = bounds
        return np.array(indexes[start:end])

    def _subset(rows):
        # Apply the same row selection to every source so the groups stay
        # aligned across sources.
        return Data(**{
            name: source[rows, :]
            for name, source in self.sources.items()
        })

    return (
        query(boundaries)
        .scan()
        # int() truncates, so for non-negative weights the position is the
        # same under integer division (Python 2) and true division (Python 3).
        .select(lambda n: int(data_length * n / splits_total))
        .then(_window, n=2)
        .select(_rows)
        .select(_subset)
        .to_list()
    )
评论列表
文章目录