Update API

pockerman · pockerman · commit 6d5be8ed786a · 2022-01-11T10:43:15.000Z
diff --git a/src/spaces/actions.py b/src/spaces/actions.py
@@ -46,6 +46,13 @@ def act(self, **ops) -> None:
         :return:
         """
 
+    @abc.abstractmethod
+    def get_maximum_number_of_transforms(self):
+        """
+        Returns the maximum number of transforms that the action applies
+        :return:
+        """
+
 
 def move_next(iterators: List) -> None:
     """
@@ -90,6 +97,13 @@ def act(self, **ops):
         """
         pass
 
+    def get_maximum_number_of_transforms(self):
+        """
+        Returns the maximum number of transforms that the action applies
+        :return:
+        """
+        return 1
+
 
 class ActionTransform(ActionBase):
 
@@ -106,6 +120,13 @@ def act(self, **ops):
         """
         pass
 
+    def get_maximum_number_of_transforms(self):
+        """
+        Returns the maximum number of transforms that the action applies
+        :return:
+        """
+        raise NotImplementedError("Method not implemented")
+
 
 class ActionSuppress(ActionBase, _WithTable):
 
@@ -138,6 +159,21 @@ def act(self, **ops) -> None:
         # update the generalization
         move_next(iterators=self.iterators)
 
+    def get_maximum_number_of_transforms(self):
+        """
+        Returns the maximum number of transforms that the action applies
+        :return:
+        """
+        max_transform = 0
+
+        for item in self.table:
+            size = len(self.table[item])
+
+            if size > max_transform:
+                max_transform = size
+
+        return max_transform
+
 
 class ActionGeneralize(ActionBase, _WithTable):
     """
@@ -181,5 +217,21 @@ def act(self, **ops):
     def add_generalization(self, key: str, values: HierarchyBase) -> None:
         self.table[key] = values
 
+    def get_maximum_number_of_transforms(self):
+        """
+        Returns the maximum number of transforms that the action applies
+        :return:
+        """
+        max_transform = 0
+
+        for item in self.table:
+            size = len(self.table[item])
+
+            if size > max_transform:
+                max_transform = size
+
+        return max_transform
+
+
 
 
diff --git a/src/spaces/environment.py b/src/spaces/environment.py
@@ -13,9 +13,11 @@
 
 from src.exceptions.exceptions import Error
 from src.spaces.actions import ActionBase, ActionType
+from src.spaces.state_space import StateSpace, State
 from src.utils.string_distance_calculator import DistanceType, TextDistanceCalculator
 
 DataSet = TypeVar("DataSet")
+RewardManager = TypeVar("RewardManager")
 
 _Reward = TypeVar('_Reward')
 _Discount = TypeVar('_Discount')
@@ -65,20 +67,37 @@ def last(self) -> bool:
 class Environment(object):
 
     def __init__(self, data_set, action_space,
-                 gamma: float, start_column: str, ):
+                 gamma: float, start_column: str, reward_manager: RewardManager):
         self.data_set = data_set
         self.start_ds = copy.deepcopy(data_set)
         self.current_time_step = self.start_ds
         self.action_space = action_space
         self.gamma = gamma
         self.start_column = start_column
         self.column_distances = {}
+        self.state_space = StateSpace()
         self.distance_calculator = None
+        self.reward_manager: RewardManager = reward_manager
+
+        # initialize the state space
+        self.state_space.init_from_environment(env=self)
 
     @property
     def n_features(self) -> int:
+        """
+        Returns the number of features in the dataset
+        :return:
+        """
         return self.start_ds.n_columns
 
+    @property
+    def feature_names(self) -> list:
+        """
+        Returns the feature names in the dataset
+        :return:
+        """
+        return self.start_ds.get_columns_names()
+
     @property
     def n_examples(self) -> int:
         return self.start_ds.n_rows
@@ -99,6 +118,24 @@ def initialize_text_distances(self, distance_type: DistanceType) -> None:
     def sample_action(self) -> ActionBase:
         return self.action_space.sample_and_get()
 
+    def get_column_as_tensor(self, column_name) -> torch.Tensor:
+        """
+        Returns the column in the dataset as a torch tensor
+        :param column_name:
+        :return:
+        """
+        data = {}
+
+        if self.start_ds.columns[column_name] == str:
+
+            numpy_vals = self.column_distances[column_name]
+            data[column_name] = numpy_vals
+        else:
+            data[column_name] = self.data_set.get_column(col_name=column_name).to_numpy()
+
+        target_df = pd.DataFrame(data)
+        return torch.tensor(target_df.to_numpy(), dtype=torch.float64)
+
     def get_ds_as_tensor(self) -> torch.Tensor:
 
         """
@@ -111,7 +148,6 @@ def get_ds_as_tensor(self) -> torch.Tensor:
         for col in col_names:
 
             if self.start_ds.columns[col] == str:
-                #print("col: {0} type {1}".format(col, self.start_ds.get_column_type(col_name=col)))
                 numpy_vals = self.column_distances[col]
                 data[col] = numpy_vals
             else:
@@ -195,28 +231,22 @@ def step(self, action: ActionBase) -> TimeStep:
         `action` will be ignored.
         """
 
+        # apply the action
         self.apply_action(action=action)
 
-        # if the action is identity don't bother
-        # doing anything
-        #if action.action_type == ActionType.IDENTITY:
-        #    return TimeStep(step_type=StepType.MID, reward=0.0,
-        #                    observation=self.get_ds_as_tensor().float(), discount=self.gamma)
-
-        # apply the transform of the data set
-        #self.data_set.apply_column_transform(transform=action)
+        # update the state space
+        self.state_space.update_state(state_name=action.column_name, status=action.action_type)
 
         # perform the action on the data set
         self.prepare_column_states()
 
         # calculate the information leakage and establish the reward
         # to return to the agent
+        reward = self.reward_manager.get_state_reward(self.state_space, action)
 
-        return TimeStep(step_type=StepType.MID, reward=0.0,
-                        observation=self.get_ds_as_tensor().float(), discount=self.gamma)
-
-
-
+        return TimeStep(step_type=StepType.MID, reward=reward,
+                        observation=self.get_column_as_tensor(column_name=action.column_name).float(),
+                        discount=self.gamma)
 
 
 class MultiprocessEnv(object):
diff --git a/src/tests/test_environment.py b/src/tests/test_environment.py
@@ -10,6 +10,7 @@
 from src.utils.serial_hierarchy import SerialHierarchy
 from src.utils.string_distance_calculator import DistanceType
 from src.datasets.dataset_wrapper import PandasDSWrapper
+from src.utils.reward_manager import RewardManager
 
 
 class TestEnvironment(unittest.TestCase):
@@ -20,6 +21,9 @@ def setUp(self) -> None:
         :return: None
         """
 
+        # specify the reward manager to use
+        self.reward_manager = RewardManager()
+
         # read the data
         filename = Path("../../data/mocksubjects.csv")
 
@@ -35,7 +39,26 @@ def setUp(self) -> None:
                                            "drop_na": True,
                                            "change_col_vals": {"diagnosis": [('N', 0)]}})
 
-    #@pytest.mark.skip(reason="no way of currently testing this")
+        self.generalization_table = {"Mixed White/Asian": SerialHierarchy(values=["Mixed", ]),
+                                "Chinese": SerialHierarchy(values=["Asian", ]),
+                                "Indian": SerialHierarchy(values=["Asian", ]),
+                                "Mixed White/Black African": SerialHierarchy(values=["Mixed", ]),
+                                "Black African": SerialHierarchy(values=["Black", ]),
+                                "Asian other": SerialHierarchy(values=["Asian", ]),
+                                "Black other": SerialHierarchy(values=["Black", ]),
+                                "Mixed White/Black Caribbean": SerialHierarchy(values=["Mixed", ]),
+                                "Mixed other": SerialHierarchy(values=["Mixed", ]),
+                                "Arab": SerialHierarchy(values=["Asian", ]),
+                                "White Irish": SerialHierarchy(values=["White", ]),
+                                "Not stated": SerialHierarchy(values=["Not stated"]),
+                                "White Gypsy/Traveller": SerialHierarchy(values=["White", ]),
+                                "White British": SerialHierarchy(values=["White", ]),
+                                "Bangladeshi": SerialHierarchy(values=["Asian", ]),
+                                "White other": SerialHierarchy(values=["White", ]),
+                                "Black Caribbean": SerialHierarchy(values=["Black", ]),
+                                "Pakistani": SerialHierarchy(values=["Asian", ])}
+
+    @pytest.mark.skip(reason="no way of currently testing this")
     def test_prepare_column_states_throw_Error(self):
         # specify the action space. We need to establish how these actions
         # are performed
@@ -47,7 +70,7 @@ def test_prepare_column_states_throw_Error(self):
         with pytest.raises(Error):
             env.prepare_column_states()
 
-    #@pytest.mark.skip(reason="no way of currently testing this")
+    @pytest.mark.skip(reason="no way of currently testing this")
     def test_prepare_column_states(self):
         # specify the action space. We need to establish how these actions
         # are performed
@@ -59,14 +82,15 @@ def test_prepare_column_states(self):
         env.initialize_text_distances(distance_type=DistanceType.COSINE)
         env.prepare_column_states()
 
-    #@pytest.mark.skip(reason="no way of currently testing this")
+    @pytest.mark.skip(reason="no way of currently testing this")
     def test_get_numeric_ds(self):
         # specify the action space. We need to establish how these actions
         # are performed
         action_space = ActionSpace(n=1)
 
         # create the environment and
-        env = Environment(data_set=self.ds, action_space=action_space, gamma=0.99, start_column="gender")
+        env = Environment(data_set=self.ds, action_space=action_space, gamma=0.99,
+                          start_column="gender", reward_manager=self.reward_manager)
 
         env.initialize_text_distances(distance_type=DistanceType.COSINE)
         env.prepare_column_states()
@@ -85,6 +109,7 @@ def test_apply_action(self):
         # are performed
         action_space = ActionSpace(n=1)
 
+        """
         generalization_table = {"Mixed White/Asian": SerialHierarchy(values=["Mixed", ]),
                                 "Chinese": SerialHierarchy(values=["Asian", ]),
                                 "Indian": SerialHierarchy(values=["Asian", ]),
@@ -103,11 +128,13 @@ def test_apply_action(self):
                                 "White other": SerialHierarchy(values=["White", ]),
                                 "Black Caribbean": SerialHierarchy(values=["Black", ]),
                                 "Pakistani": SerialHierarchy(values=["Asian", ])}
+        """
 
-        action_space.add(ActionGeneralize(column_name="ethnicity", generalization_table=generalization_table))
+        action_space.add(ActionGeneralize(column_name="ethnicity", generalization_table=self.generalization_table))
 
         # create the environment and
-        env = Environment(data_set=self.ds, action_space=action_space, gamma=0.99, start_column="gender")
+        env = Environment(data_set=self.ds, action_space=action_space,
+                          gamma=0.99, start_column="gender", reward_manager=self.reward_manager)
 
         # this will update the environment
         env.apply_action(action=action_space[0])
@@ -116,10 +143,29 @@ def test_apply_action(self):
         # get the unique values for the ethnicity column
         unique_col_vals = env.data_set.get_column_unique_values(col_name="ethnicity")
 
-        print(unique_col_vals)
-
         unique_vals = ["Mixed", "Asian", "Not stated", "White", "Black"]
         self.assertEqual(len(unique_vals), len(unique_col_vals))
+        self.assertEqual(unique_vals, unique_col_vals)
+
+    def test_step(self):
+        # specify the action space. We need to establish how these actions
+        # are performed
+        action_space = ActionSpace(n=1)
+        action_space.add(ActionGeneralize(column_name="ethnicity", generalization_table=self.generalization_table))
+
+        # create the environment and
+        env = Environment(data_set=self.ds, action_space=action_space,
+                          gamma=0.99, start_column="gender", reward_manager=self.reward_manager)
+
+        action = env.sample_action()
+
+        # this will update the environment
+        time_step = env.step(action=action)
+
+
+
+
+
 
 if __name__ == '__main__':
     unittest.main()
diff --git a/src/utils/hierarchy_base.py b/src/utils/hierarchy_base.py
@@ -12,4 +12,5 @@
 class HierarchyBase(metaclass=abc.ABCMeta):
 
     def __init__(self):
-        pass
+        pass
+    
diff --git a/src/utils/serial_hierarchy.py b/src/utils/serial_hierarchy.py
@@ -35,6 +35,13 @@ def __next__(self):
 
         raise StopIteration
 
+    def __len__(self):
+        """
+        Returns the total number of items in the iterator
+        :return:
+        """
+        return len(self.values)
+
 
 class SerialHierarchy(HierarchyBase):
 
@@ -68,3 +75,10 @@ def value(self) -> Any:
         """
         return self.iterator.at
 
+    def __len__(self):
+        """
+        Returns the size of the hierarchy
+        :return:
+        """
+        return len(self.iterator)
+