Skip to content

Commit ad454c6

Browse files
committed
Add transformer for mock data
1 parent e950a01 commit ad454c6

File tree

1 file changed

+21
-0
lines changed

1 file changed

+21
-0
lines changed
Lines changed: 21 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,21 @@
1+
import csv
2+
from pathlib import Path
3+
from src.datasets.datasets_loaders import MockSubjectsLoader
4+
5+
if __name__ == '__main__':
    # Destination of the exported mock-subjects table.
    output_csv = Path("/home/alex/qi3/drl_anonymity/data/hierarchies/normalized_salary_mocksubjects.csv")

    # Candidate drop list: the loader's current defaults plus four extra columns.
    # NOTE(review): this list is built but never applied -- the loader is
    # configured with an empty drop list on the next statement. Confirm that
    # keeping every column is the intended behaviour for this export.
    extra_drop_names = ["preventative_treatment", "gender", "education", "mutation_status"]
    unused_drop_columns = MockSubjectsLoader.FEATURES_DROP_NAMES + extra_drop_names
    MockSubjectsLoader.FEATURES_DROP_NAMES = []

    # Ask the loader to normalize the salary column.
    MockSubjectsLoader.NORMALIZED_COLUMNS = ["salary"]

    # Columns to load, each mapped to the Python type it is declared with.
    MockSubjectsLoader.COLUMNS_TYPES = {
        "gender": str,
        "ethnicity": str,
        "education": int,
        "salary": float,
        "diagnosis": int,
        "preventative_treatment": str,
        "mutation_status": int,
    }

    # The class-level settings above must be in place before the loader is
    # instantiated; the instance is then written out without its index.
    loader = MockSubjectsLoader()
    loader.save_to_csv(filename=output_csv, save_index=False)

0 commit comments

Comments
 (0)