pgmpy · ankurankan · Mar 14, 2023 · Mar 14, 2023 · Mar 14, 2023 · Mar 14, 2023
diff --git a/pgmpy/models/DynamicBayesianNetwork.py b/pgmpy/models/DynamicBayesianNetwork.py
@@ -814,7 +814,7 @@ def get_constant_bn(self, t_slice=0):
         bn.add_cpds(*new_cpds)
         return bn
 
-    def fit(self, data, estimator="MLE"):
+    def fit(self, data, estimator="MLE", state_names={}, n_jobs=-1):
         """
         Learns the CPD of the model from data.
 
@@ -831,6 +831,16 @@ def fit(self, data, estimator="MLE"):
         estimator: str
             Currently only Maximum Likelihood Estimator is supported.
 
+        state_names: dict (optional)
+            A dict indicating, for each variable, the discrete set of states
+            that the variable can take. If unspecified, the observed values
+            in the data set are taken to be the only possible states.
+
+        n_jobs: int (default: -1)
+            Number of threads/processes to use for estimation. It improves speed only
+            for large networks (>100 nodes). For smaller networks, it might reduce
+            performance.
+
         Returns
         -------
         None: The CPDs are added to the model instance.
@@ -895,21 +905,37 @@ def fit(self, data, estimator="MLE"):
 
             # Fit or fit_update with df_slice depending on the time slice
             if t_slice == 0:
-                const_bn.fit(df_slice)
+                if state_names != {}:
+                    state_names = {
+                        **{
+                            str(var) + "_" + str(0): s for var, s in state_names.items()
+                        },
+                        **{
+                            str(var) + "_" + str(1): s for var, s in state_names.items()
+                        },
+                    }
+                const_bn.fit(df_slice, state_names=state_names, n_jobs=n_jobs)
             else:
-                const_bn.fit_update(df_slice, n_prev_samples=t_slice * n_samples)
+                const_bn.fit_update(
+                    df_slice, n_prev_samples=t_slice * n_samples, n_jobs=n_jobs
+                )
 
         cpds = []
         for cpd in const_bn.cpds:
             var_tuples = [var.rsplit("_", 1) for var in cpd.variables]
             new_vars = [DynamicNode(var, int(t)) for var, t in var_tuples]
+            state_names = {
+                var: cpd.state_names[str(var.node) + "_" + str(var.time_slice)]
+                for var in new_vars
+            }
             cpds.append(
                 TabularCPD(
                     variable=new_vars[0],
                     variable_card=cpd.variable_card,
                     values=cpd.get_values(),
                     evidence=new_vars[1:],
                     evidence_card=cpd.cardinality[1:],
+                    state_names=state_names,
                 )
             )
 

diff --git a/pgmpy/tests/test_models/test_DynamicBayesianNetwork.py b/pgmpy/tests/test_models/test_DynamicBayesianNetwork.py
@@ -429,6 +429,26 @@ def test_fit(self):
         df = pd.DataFrame(data, columns=colnames)
         model.fit(df)
 
+        self.assertTrue(model.check_model())
+        self.assertEqual(len(model.cpds), 8)
+        for cpd in model.cpds:
+            np_test.assert_almost_equal(cpd.values, 0.5, decimal=1)
+
+        model = DBN(
+            [
+                (("A", 0), ("B", 0)),
+                (("A", 0), ("C", 0)),
+                (("B", 0), ("D", 0)),
+                (("C", 0), ("D", 0)),
+                (("A", 0), ("A", 1)),
+                (("B", 0), ("B", 1)),
+                (("C", 0), ("C", 1)),
+                (("D", 0), ("D", 1)),
+            ]
+        )
+        model.fit(
+            df, state_names={"A": [0, 1, 2], "B": [0, 1, 2], "C": [0, 1], "D": [0, 1]}
+        )
         self.assertTrue(model.check_model())
         self.assertEqual(len(model.cpds), 8)
         for cpd in model.cpds: