Skip to content

Commit cf24d73

Browse files
Add unittest with DataFrame subset and row_indices!=None for CSVDataset()
Signed-off-by: Bartosz Grabowski <[email protected]>
1 parent ee6fb86 commit cf24d73

File tree

1 file changed

+7
-0
lines changed

1 file changed

+7
-0
lines changed

tests/data/test_csv_dataset.py

Lines changed: 7 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -186,6 +186,13 @@ def prepare_csv_file(data, filepath):
186186
self.assertEqual(len(dataset), 3)
187187
np.testing.assert_allclose([round(i, 4) for i in dataset[1]["ehr"]], [3.3333, 3.2353, 3.4000])
188188

189+
# test pre-loaded DataFrame subset with row_indices != None
190+
df = pd.read_csv(filepath1)
191+
df_subset = df.iloc[[1, 3, 4]]
192+
dataset = CSVDataset(src=df_subset, row_indices=[1, 3], col_groups={"ehr": [f"ehr_{i}" for i in range(3)]})
193+
self.assertEqual(len(dataset), 2)
194+
np.testing.assert_allclose([round(i, 4) for i in dataset[1]["ehr"]], [3.3333, 3.2353, 3.4000])
195+
189196
# test pre-loaded multiple DataFrames, join tables with kwargs
190197
dfs = [pd.read_csv(i) for i in filepaths]
191198
dataset = CSVDataset(src=dfs, on="subject_id")

0 commit comments

Comments
 (0)