def test_prepare_dataset(self, fetch, chamber_of_deputies):
    """
    Check the dataset exposed by `self.subject.dataset`.

    * Every key of `ADAPTER_COLUMNS` is present among its columns.
    * `document_type` is a category column with the expected categories.
    * Rows matching "Congressperson meal" in the fixture have `Meal` as
      their only `category` value.
    * Rows with a null `congressperson_id` in the fixture have `True` as
      their only `is_party_expense` value.

    `fetch` and `chamber_of_deputies` are not used in the body
    (presumably mocks injected by patch decorators -- confirm at the
    definition site).
    """
    prepared = self.subject.dataset

    # Columns: all adapter keys must be present after preparation.
    expected_columns = set(ADAPTER_COLUMNS.keys())
    self.assertTrue(expected_columns.issubset(set(prepared.columns)))

    # Categories are compared as ordered lists, so their order matters.
    expected_types = ['bill_of_sale', 'simple_receipt', 'expense_made_abroad']
    actual_types = prepared['document_type'].cat.categories.tolist()
    self.assertEqual(expected_types, actual_types)

    # The fixture is only used to locate row labels; the assertions below
    # look those labels up in the prepared dataset.
    fixture_file = os.path.join(self.fixtures_path, 'reimbursements.xz')
    raw = pd.read_csv(fixture_file)

    meal_filter = 'subquota_description == "Congressperson meal"'
    meal_index = raw.query(meal_filter).index
    meal_categories = prepared.loc[meal_index, 'category'].unique().tolist()
    self.assertEqual(['Meal'], meal_categories)

    without_congressperson = raw['congressperson_id'].isnull()
    party_index = raw[without_congressperson].index
    party_flags = prepared.loc[party_index, 'is_party_expense']
    self.assertEqual([True], party_flags.unique().tolist())
评论列表
文章目录