econ-ark · sbenthall · Jun 17, 2021 · Jun 16, 2021 · Jun 16, 2021 · Jun 16, 2021
diff --git a/Documentation/CHANGELOG.md b/Documentation/CHANGELOG.md
@@ -14,6 +14,7 @@ Release Data: TBD
 
 #### Major Changes
 
+* A IndexDistribution class for representing time-indexed probability distributions [#1018](https://github.com/econ-ark/pull/1018/).
 * Adds new consumption-savings-portfolio model `RiskyContrib`, which represents an agent who can save in risky and risk-free assets but faces
 frictions to moving funds between them. To circumvent these frictions, he has access to an income-deduction scheme to accumulate risky assets.
 PR: [#832](https://github.com/econ-ark/HARK/pull/832). See [this forthcoming REMARK](https://github.com/Mv77/RiskyContrib) for the model's details.

diff --git a/HARK/ConsumptionSaving/ConsRiskyAssetModel.py b/HARK/ConsumptionSaving/ConsRiskyAssetModel.py
@@ -15,6 +15,7 @@
 
 from HARK.distribution import (
     combine_indep_dstns,
+    IndexDistribution,
     Lognormal,
     Bernoulli,
 )
@@ -90,13 +91,17 @@ def update_RiskyDstn(self):
         # Generate a discrete approximation to the risky return distribution if the
         # agent has age-varying beliefs about the risky asset
         if "RiskyAvg" in self.time_vary:
-            self.RiskyDstn = []
-            for t in range(self.T_cycle):
-                self.RiskyDstn.append(
-                    Lognormal.from_mean_std(self.RiskyAvg[t], self.RiskyStd[t]).approx(
-                        self.RiskyCount
-                    )
-                )
+            self.RiskyDstn = IndexDistribution(
+                Lognormal.from_mean_std,
+                {
+                    'mean' : self.RiskyAvg,
+                    'std' : self.RiskyStd
+                },
+                seed=self.RNG.randint(0, 2 ** 31 - 1)
+            ).approx(
+                self.RiskyCount
+            )
+
             self.add_to_time_vary("RiskyDstn")
 
         # Generate a discrete approximation to the risky return distribution if the
@@ -202,25 +207,11 @@ def get_Adjust(self):
         -------
         None
         """
-        if not ("AdjustPrb" in self.time_vary):
-
-            self.shocks["Adjust"] = Bernoulli(
-                self.AdjustPrb, seed=self.RNG.randint(0, 2 ** 31 - 1)
-            ).draw(self.AgentCount)
-
-        else:
-
-            Adjust = np.zeros(self.AgentCount)  # Initialize shock array
-            for t in range(self.T_cycle):
-                these = t == self.t_cycle
-                N = np.sum(these)
-                if N > 0:
-                    AdjustPrb = self.AdjustPrb[t - 1]
-                    Adjust[these] = Bernoulli(
-                        AdjustPrb, seed=self.RNG.randint(0, 2 ** 31 - 1)
-                    ).draw(N)
-
-            self.shocks["Adjust"] = Adjust
+        self.shocks['Adjust'] = IndexDistribution(
+            Bernoulli,
+            {'p' : self.AdjustPrb},
+            seed=self.RNG.randint(0, 2 ** 31 - 1)
+            ).draw(self.t_cycle)
 
     def initialize_sim(self):
         """

diff --git a/HARK/distribution.py b/HARK/distribution.py
@@ -8,6 +8,8 @@
 
 class Distribution:
     """
+    Base class for all probability distributions.
+
     Parameters
     ----------
     seed : int
@@ -27,6 +29,147 @@ def reset(self):
         """
         self.RNG = np.random.RandomState(self.seed)
 
+class IndexDistribution(Distribution):
+    """
+    This class provides a way to define a distribution that
+    is conditional on an index.
+
+    The current implementation combines a defined distribution
+    class (such as Bernoulli, LogNormal, etc.) with information
+    about the conditions on the parameters of the distribution.
+
+    For example, an IndexDistribution can be defined as
+    a Bernoulli distribution whose parameter p is a function of
+    a different inpute parameter.
+
+    Parameters
+    ----------
+
+    engine : Distribution class
+        A Distribution subclass.
+
+    conditional: dict
+        Information about the conditional variation
+        on the input parameters of the engine distribution.
+        Keys should match the arguments to the engine class
+        constructor.
+
+    seed : int
+        Seed for random number generator.
+    """
+    conditional = None
+    engine = None
+
+    def __init__(self, engine, conditional, seed = 0):
+        # Set up the RNG
+        super().__init__(seed)
+
+        self.conditional = conditional
+        self.engine = engine
+
+    def __getitem__(self, y):
+        # test one item to determine case handling
+        item0 = list(self.conditional.values())[0]
+
+        if type(item0) is list:
+            cond = {key : val[y] for (key, val) in self.conditional.items()}
+            return self.engine(
+                    seed=self.RNG.randint(0, 2 ** 31 - 1),
+                    **cond
+                )
+        else:
+            raise(Exception(
+                f"IndexDistribution: Unhandled case for __getitem__ access. y: {y}; conditional: {conditional}"
+                ))
+
+    def approx(self, N, **kwds):
+        """
+        Approximation of the distribution.
+
+        Parameters
+        ----------
+        N : init
+            Number of discrete points to approximate
+            continuous distribution into.
+
+        kwds: dict
+            Other keyword arguments passed to engine
+            distribution approx() method.
+
+        Returns:
+        ------------
+        dists : [DiscreteDistribution]
+            A list of DiscreteDistributions that are the
+            approximation of engine distribution under each condition.
+
+            TODO: It would be better if there were a conditional discrete
+            distribution representation. But that integrates with the
+            solution code. This implementation will return the list of
+            distributions representations expected by the solution code.
+        """
+
+        # test one item to determine case handling
+        item0 = list(self.conditional.values())[0]
+
+        if type(item0) is float:
+            # degenerate case. Treat the parameterization as constant.
+            return self.engine(
+                seed = self.RNG.randint(0, 2 ** 31 - 1),
+                **self.conditional
+                ).approx(N,**kwds)
+
+        if type(item0) is list:
+            return [self[i].approx(N,**kwds) for i, _ in enumerate(item0)]
+
+
+    def draw(self, condition):
+        """
+        Generate arrays of draws.
+        The input is an array containing the conditions.
+        The output is an array of the same length (axis 1 dimension)
+        as the conditions containing random draws of the conditional
+        distribution.
+
+        Parameters
+        ----------
+        condition : np.array
+            The input conditions to the distribution.
+
+        Returns:
+        ------------
+        draws : np.array
+        """
+        # for now, assume that all the conditionals
+        # are of the same type.
+        # this matches the HARK 'time-varying' model architecture.
+
+        # test one item to determine case handling
+        item0 = list(self.conditional.values())[0]
+
+        if type(item0) is float:
+            # degenerate case. Treat the parameterization as constant.
+            N = condition.size
+
+            return self.engine(
+                seed = self.RNG.randint(0, 2 ** 31 - 1),
+                **self.conditional
+                ).draw(N)
+
+        if type(item0) is list:
+            # conditions are indices into list
+            # somewhat convoluted sampling strategy retained
+            # for test backwards compatibility
+
+            draws = np.zeros(condition.size)
+
+            for c in np.unique(condition):
+                these = c == condition
+                N = np.sum(these)
+
+                cond = {key : val[c] for (key, val) in self.conditional.items()}
+                draws[these] = self[c].draw(N)
+
+            return draws
 
 ### CONTINUOUS DISTRIBUTIONS
 
@@ -64,7 +207,7 @@ def __init__(self, mu=0.0, sigma=1.0, seed=0):
 
     def draw(self, N):
         """
-        Generate arrays of lognormal draws. The sigma input can be a number
+        Generate arrays of lognormal draws. The sigma parameter can be a number
         or list-like.  If a number, output is a length N array of draws from the
         lognormal distribution with standard deviation sigma. If a list, output is
         a length T list whose t-th entry is a length N array of draws from the
@@ -74,8 +217,6 @@ def draw(self, N):
         ----------
         N : int
             Number of draws in each row.
-        seed : int
-            Seed for random number generator.
 
         Returns:
         ------------

diff --git a/HARK/tests/test_distribution.py b/HARK/tests/test_distribution.py
@@ -5,6 +5,7 @@
 
 from HARK.distribution import (
     Bernoulli,
+    IndexDistribution,
     DiscreteDistribution,
     Lognormal,
     MeanOneLogNormal,
@@ -152,6 +153,51 @@ def test_Uniform(self):
     def test_Bernoulli(self):
         self.assertEqual(Bernoulli().draw(1)[0], False)
 
+class IndexDistributionClassTests(unittest.TestCase):
+    """
+    Tests for distribution.py sampling distributions
+    with default seed.
+    """
+
+    def test_IndexDistribution(self):
+        cd = IndexDistribution(Bernoulli, {'p' : [.01, .5, .99]})
+
+        conditions = np.array([0,0,0,0,1,1,1,1,1,1,1,1,2,2,2,2])
+
+        draws = cd.draw(conditions)
+
+        self.assertEqual(draws[:4].sum(), 0)
+        self.assertEqual(draws[-4:].sum(),4)
+        self.assertEqual(cd[2].p.tolist(), .99)
+
+    def test_IndexDistribution_approx(self):
+        cd = IndexDistribution(
+            Lognormal,
+            {
+                'mu' : [.01, .5, .99],
+                'sigma' : [.05, .05, .05]
+            }
+        )
+
+        approx = cd.approx(10)
+
+        draw = approx[2].draw(5)
+
+        self.assertAlmostEqual(draw[1], 2.93868620)
+
+    def test_IndexDistribution_seeds(self):
+        cd = IndexDistribution(
+            Lognormal,
+            {
+                'mu' : [1, 1],
+                'sigma' : [1, 1]
+            }
+        )
+
+        draw_0 = cd[0].draw(1).tolist()
+        draw_1 = cd[1].draw(1).tolist()
+
+        self.assertNotEqual(draw_0, draw_1)
 
 class MarkovProcessTests(unittest.TestCase):
     """