Update API

pockerman · pockerman · commit 1b54a8138470 · 2022-01-04T13:40:30.000Z
diff --git a/src/algorithms/a2c.py b/src/algorithms/a2c.py
@@ -41,20 +41,32 @@ def forward(self, x):
         return pol_out, val_out
 
 
+class A2CConfig(object):
+    """
+    Configuration for A2C algorithm
+    """
+
+    def __init__(self):
+        self.gamma: float = 0.99
+        self.tau: float = 1.2
+        self.n_workers: int = 1
+        self.n_iterations_per_episode: int = 100
+        self.optimizer: Optimizer = None
+        self.loss_function: LossFunction = None
+
+
 class A2C(Generic[Optimizer]):
 
-    def __init__(self, gamma: float, tau: float, n_workers: int,
-                 n_iterations: int,  optimizer: Optimizer,
-                 a2c_net: A2CNet, loss_function: LossFunction):
+    def __init__(self, config: A2CConfig, a2c_net: A2CNet):
 
-        self.gamma = gamma
-        self.tau = tau
-        self.rewards = []
-        self.n_workers = n_workers
-        self.n_iterations = n_iterations
-        self.optimizer = optimizer
+        self.gamma = config.gamma
+        self.tau = config.tau
+        self.n_workers = config.n_workers
+        self.n_iterations_per_episode = config.n_iterations_per_episode
+        self.optimizer = config.optimizer
+        self.loss_function = config.loss_function
         self.a2c_net = a2c_net
-        self.loss_function = loss_function
+        self.rewards = []
         self.name = "A2C"
 
     def _optimize_model(self):
@@ -80,7 +92,8 @@ def train(self, env: Env) -> None:
 
         observation = time_step.observation
 
-        for iteration in range(1, self.n_iterations + 1):
+        # learn over the episode
+        for iteration in range(1, self.n_iterations_per_episode + 1):
 
             # select an action
             action = self.select_action(env=env, observation=observation)
diff --git a/src/algorithms/trainer.py b/src/algorithms/trainer.py
@@ -33,5 +33,4 @@ def train(self):
             if self.configuration["update_frequency"] % episode == 0:
                 self.agent.update()
 
-
         print("{0} Training finished for agent {1}".format(INFO, self.agent.name))
diff --git a/src/datasets/dataset_wrapper.py b/src/datasets/dataset_wrapper.py
@@ -112,7 +112,12 @@ def sample_column(self):
         return self.get_column(col_name=col_names[col_idx])
 
     def apply_transform(self, transform: Transform) -> None:
-        pass
+
+        # get the column the transform targets
+        column = self.get_column(col_name=transform.column_name)
+        column = transform.act(**{"data": column})
+        self.ds[transform.column_name] = column
+
 
 
 
diff --git a/src/spaces/action_space.py b/src/spaces/action_space.py
@@ -9,11 +9,16 @@ def __init__(self, n: int) -> None:
         super(ActionSpace, self).__init__(n=n)
         self.actions = []
 
+    def __getitem__(self, item):
+        return self.actions[item]
+
     def add(self, action: ActionBase) -> None:
 
         if len(self.actions) >= self.n:
             raise ValueError("Action space is saturated. You cannot add a new action")
 
+        # set a valid id for the action
+        action.idx = len(self.actions)
         self.actions.append(action)
 
     def add_may(self, *actions) -> None:
diff --git a/src/spaces/actions.py b/src/spaces/actions.py
@@ -33,8 +33,11 @@ class ActionBase(metaclass=abc.ABCMeta):
     Base class for actions
     """
 
-    def __init__(self, action_type: ActionType) -> None:
+    def __init__(self, column_name: str, action_type: ActionType) -> None:
+        self.column_name = column_name
         self.action_type = action_type
+        self.idx = None
+        self.key = (self.column_name, self.action_type)
 
     @abc.abstractmethod
     def act(self, **ops) -> None:
@@ -77,8 +80,8 @@ class ActionIdentity(ActionBase):
     Implements the identity action
     """
 
-    def __init__(self) -> None:
-        super(ActionIdentity, self).__init__(action_type=ActionType.IDENTITY)
+    def __init__(self, column_name: str) -> None:
+        super(ActionIdentity, self).__init__(column_name=column_name, action_type=ActionType.IDENTITY)
 
     def act(self, **ops):
         """
@@ -93,8 +96,8 @@ class ActionTransform(ActionBase):
     """
     Implements the transform action
     """
-    def __init__(self):
-        super(ActionTransform, self).__init__(action_type=ActionType.TRANSFORM)
+    def __init__(self, column_name: str):
+        super(ActionTransform, self).__init__(column_name=column_name, action_type=ActionType.TRANSFORM)
 
     def act(self, **ops):
         """
@@ -109,8 +112,8 @@ class ActionSuppress(ActionBase, _WithTable):
     """
     Implements the suppress action
     """
-    def __init__(self, suppress_table=None):
-        super(ActionSuppress, self).__init__(action_type=ActionType.SUPPRESS)
+    def __init__(self, column_name: str, suppress_table=None):
+        super(ActionSuppress, self).__init__(column_name=column_name, action_type=ActionType.SUPPRESS)
 
         if suppress_table is not None:
             self.table = suppress_table
@@ -136,36 +139,47 @@ def act(self, **ops) -> None:
         move_next(iterators=self.iterators)
 
 
-class ActionGeneralize(ActionBase):
+class ActionGeneralize(ActionBase, _WithTable):
     """
     Implements the generalization action
     """
 
-    def __init__(self):
-        super(ActionGeneralize, self).__init__(action_type=ActionType.GENERALIZE)
-        self.generalization_table = {}
+    def __init__(self, column_name: str, generalization_table: dict = None):
+        super(ActionGeneralize, self).__init__(column_name=column_name, action_type=ActionType.GENERALIZE)
+
+        if generalization_table is not None:
+            self.table = generalization_table
+
+        # fill in the iterators
+        self.iterators = [iter(self.table[item]) for item in self.table]
 
     def act(self, **ops):
         """
         Perform an action
         :return:
         """
+
+        # get the values of the column
+        col_vals = ops['data'].values
+
         # generalize the data given
-        for item in ops["data"]:
+        for i, item in enumerate(col_vals):
 
+            #print(item)
             # How do we update the generalizations?
-            value = self.generalization_table[item].value
-            item = value
+            value = self.table[item].value
+            col_vals[i] = value
 
-        # update the generalization
-        self._move_next()
+        ops["data"] = col_vals
 
-    def add_generalization(self, key: str, values: HierarchyBase) -> None:
-        self.generalization_table[key] = values
+        # advance the generalization iterators
+        # so that the next time this action is applied
+        # it generalizes according to the new values
+        move_next(iterators=self.iterators)
+        return ops['data']
 
-    def _move_next(self):
+    def add_generalization(self, key: str, values: HierarchyBase) -> None:
+        self.table[key] = values
 
-        for item in self.generalization_table:
-            next(self.generalization_table[item])
 
 
diff --git a/src/spaces/environment.py b/src/spaces/environment.py
@@ -12,7 +12,7 @@
 import multiprocessing as mp
 
 from src.exceptions.exceptions import Error
-from src.spaces.actions import ActionBase
+from src.spaces.actions import ActionBase, ActionType
 from src.utils.string_distance_calculator import DistanceType, TextDistanceCalculator
 
 DataSet = TypeVar("DataSet")
@@ -169,6 +169,15 @@ def reset(self, **options) -> TimeStep:
                                           observation=self.get_ds_as_tensor().float(), discount=self.gamma)
         return self.current_time_step
 
+    def apply_action(self, action: ActionBase):
+        """
+        Apply the action on the environment
+        :param action: The action to apply on the environment
+        :return:
+        """
+        # apply the action as a transform on the data set
+        self.data_set.apply_transform(transform=action)
+
     def step(self, action: ActionBase) -> TimeStep:
         """
 
@@ -182,11 +191,21 @@ def step(self, action: ActionBase) -> TimeStep:
         `action` will be ignored.
         """
 
+        # if the action is identity don't bother
+        # doing anything
+        if action.action_type == ActionType.IDENTITY:
+            return TimeStep(step_type=StepType.MID, reward=0.0,
+                            observation=self.get_ds_as_tensor().float(), discount=self.gamma)
+
+        # apply the action as a transform on the data set
         self.data_set.apply_transform(transform=action)
 
         # perform the action on the data set
         self.prepare_column_states()
 
+        # TODO: calculate the information leakage and establish the reward
+        # to return to the agent; for now the reward is fixed at 0.0
+
         return TimeStep(step_type=StepType.MID, reward=0.0,
                         observation=self.get_ds_as_tensor().float(), discount=self.gamma)
 
diff --git a/src/tests/test_actions.py b/src/tests/test_actions.py
@@ -1,7 +1,7 @@
 import unittest
 
 from src.utils.default_hierarchy import DefaultHierarchy
-from src.spaces import ActionSuppress
+from src.spaces.actions import ActionSuppress
 
 
 class TestActions(unittest.TestCase):
@@ -11,7 +11,7 @@ def test_suppress_action_creation(self):
         suppress_table = {"test": DefaultHierarchy(values=["test", "tes*", "te**", "t***", "****"]),
                           "do_not_test": DefaultHierarchy(values=["do_not_test", "do_not_tes*", "do_not_te**", "do_not_t***", "do_not_****"])}
 
-        suppress_action = ActionSuppress(suppress_table=suppress_table)
+        suppress_action = ActionSuppress(column_name="none", suppress_table=suppress_table)
 
         self.assertEqual(len(suppress_action.table), 2, "Invalid table size")
 
@@ -23,7 +23,7 @@ def test_suppress_action_act(self):
                           "do_not_test": DefaultHierarchy(values=["do_not_test", "do_not_tes*",
                                                                   "do_not_te**", "do_not_t***", "do_not_****"])}
 
-        suppress_action = ActionSuppress(suppress_table=suppress_table)
+        suppress_action = ActionSuppress(column_name="none", suppress_table=suppress_table)
 
         suppress_action.act(**{"data": data})
 
diff --git a/src/tests/test_environment.py b/src/tests/test_environment.py
@@ -5,7 +5,9 @@
 
 from src.spaces.environment import Environment
 from src.spaces.action_space import ActionSpace
+from src.spaces.actions import ActionSuppress, ActionGeneralize
 from src.exceptions.exceptions import Error
+from src.utils.default_hierarchy import DefaultHierarchy
 from src.utils.string_distance_calculator import DistanceType
 from src.datasets.dataset_wrapper import PandasDSWrapper
 
@@ -33,7 +35,7 @@ def setUp(self) -> None:
                                            "drop_na": True,
                                            "change_col_vals": {"diagnosis": [('N', 0)]}})
 
-    #@pytest.mark.skip(reason="no way of currently testing this")
+    @pytest.mark.skip(reason="no way of currently testing this")
     def test_prepare_column_states_throw_Error(self):
         # specify the action space. We need to establish how these actions
         # are performed
@@ -45,7 +47,7 @@ def test_prepare_column_states_throw_Error(self):
         with pytest.raises(Error):
             env.prepare_column_states()
 
-    #@pytest.mark.skip(reason="no way of currently testing this")
+    @pytest.mark.skip(reason="no way of currently testing this")
     def test_prepare_column_states(self):
         # specify the action space. We need to establish how these actions
         # are performed
@@ -57,6 +59,7 @@ def test_prepare_column_states(self):
         env.initialize_text_distances(distance_type=DistanceType.COSINE)
         env.prepare_column_states()
 
+    @pytest.mark.skip(reason="no way of currently testing this")
     def test_get_numeric_ds(self):
         # specify the action space. We need to establish how these actions
         # are performed
@@ -74,12 +77,49 @@ def test_get_numeric_ds(self):
         shape0 = tensor.size(dim=0)
         shape1 = tensor.size(dim=1)
 
-        self.assertEqual(shape0, env.start_ds.n_rows())
-        self.assertEqual(shape1, env.start_ds.n_columns())
+        self.assertEqual(shape0, env.start_ds.n_rows)
+        self.assertEqual(shape1, env.start_ds.n_columns)
 
+    def test_apply_action(self):
+        # specify the action space. We need to establish how these actions
+        # are performed
+        action_space = ActionSpace(n=1)
+
+        generalization_table = {"Mixed White/Asian": DefaultHierarchy(values=["Mixed", ]),
+                                "Chinese": DefaultHierarchy(values=["Asian", ]),
+                                "Indian": DefaultHierarchy(values=["Asian", ]),
+                                "Mixed White/Black African": DefaultHierarchy(values=["Mixed", ]),
+                                "Black African": DefaultHierarchy(values=["Black", ]),
+                                "Asian other": DefaultHierarchy(values=["Asian", ]),
+                                "Black other": DefaultHierarchy(values=["Black", ]),
+                                "Mixed White/Black Caribbean": DefaultHierarchy(values=["Mixed", ]),
+                                "Mixed other": DefaultHierarchy(values=["Mixed", ]),
+                                "Arab": DefaultHierarchy(values=["Asian", ]),
+                                "White Irish": DefaultHierarchy(values=["White", ]),
+                                "Not stated": DefaultHierarchy(values=["Not stated"]),
+                                "White Gypsy/Traveller": DefaultHierarchy(values=["White", ]),
+                                "White British": DefaultHierarchy(values=["White", ]),
+                                "Bangladeshi": DefaultHierarchy(values=["Asian", ]),
+                                "White other": DefaultHierarchy(values=["White", ]),
+                                "Black Caribbean": DefaultHierarchy(values=["Black", ]),
+                                "Pakistani": DefaultHierarchy(values=["Asian", ])}
+
+        action_space.add(ActionGeneralize(column_name="ethnicity", generalization_table=generalization_table))
+
+        # create the environment
+        env = Environment(data_set=self.ds, action_space=action_space, gamma=0.99, start_column="gender")
+
+        # this will update the environment
+        env.apply_action(action=action_space[0])
 
+        # test that the ethnicity column has been changed
+        # get the unique values for the ethnicity column
+        unique_col_vals = env.data_set.get_column_unique_values(col_name="ethnicity")
 
+        print(unique_col_vals)
 
+        unique_vals = ["Mixed", "Asian", "Not stated", "White", "Black"]
+        self.assertEqual(len(unique_vals), len(unique_col_vals))
 
 if __name__ == '__main__':
     unittest.main()
diff --git a/src/utils/hierarchy_base.py b/src/utils/hierarchy_base.py
@@ -3,16 +3,16 @@
 from typing import TypeVar
 
 
-HierarchyBase = TypeVar("HierarchyBase")
+#HierarchyBase = TypeVar("HierarchyBase")
 
 
 class HierarchyBase(metaclass=abc.ABCMeta):
 
     def __init__(self):
         pass
 
-    @abc.abstractmethod
-    def read_from(self, filename: Path) -> HierarchyBase:
+    #@abc.abstractmethod
+    #def read_from(self, filename: Path) -> HierarchyBase:
         """
         Reads the values of the hierarchy from the file
         :param filename: The file to read the values of the hierarchy
diff --git a/src/utils/string_distance_calculator.py b/src/utils/string_distance_calculator.py
@@ -1,7 +1,7 @@
 import numpy as np
 import textdistance
 import enum
-from src.exceptions import Error
+from src.exceptions.exceptions import Error
 
 
 class DistanceType(enum.IntEnum):