diff --git a/src/beanmachine/minibm.py b/src/beanmachine/minibm.py
new file mode 100644
index 0000000000..0e8f4b56b1
--- /dev/null
+++ b/src/beanmachine/minibm.py
@@ -0,0 +1,258 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+#
+# This source code is licensed under the MIT license found in the
+# LICENSE file in the root directory of this source tree.
+
+"""
+The file contains MiniBM, a minimal implementation of Bean Machine PPL with a Metropolis
+Hastings implementation and a coin flipping model at the end. It is standalone, in that
+MiniBM does not depend on the Bean Machine framework at all. The only two dependencies
+for MiniBM are the PyTorch library and tqdm (for progress bar).
+"""
+
+from __future__ import annotations
+
+import itertools
+import random
+from collections import defaultdict
+from functools import wraps
+from typing import NamedTuple, Callable, Tuple, Dict, Optional, List, Any
+
+import torch
+import torch.distributions as dist
+from tqdm.auto import tqdm
+
+
+class RVIdentifier(NamedTuple):
+    """
+    A struct whose attributes uniquely identifies a random variable in Bean Machine.
+
+    Args:
+        wrapper: A reference to the decorated random variable function
+        args: Arguments taken by the
+    """
+
+    wrapper: Callable
+    args: Tuple
+
+    @property
+    def function(self):
+        """A pointer to the original function that returns the distribution object"""
+        return self.wrapper.__wrapped__  # calls the original function
+
+
+def random_variable(f: Callable[Any, dist.Distribution]):
+    """A decorator that convert a Python function that returns a distribution into a
+    function that evaluates to a Bean Machine random variable.
+
+    In Bean Machine, a @random_variable function can be used in two ways:
+
+    1. When being invoked outside of an inference scope, it returns an RVIdentifier
+       without evaluating the original function.
+    2. During inference, or when being invoked from another random variable, the
+       function will update the graph (if needed) and return its value at state of
+       inference.
+
+    For example::
+
+        @random_variable
+        def foo():
+            return dist.Normal(0., 1.0)
+
+        print(foo())  # RVIdentifier(wrapper=foo, args=())
+
+        @random_variable
+        def bar():
+            mean = foo()  # evaluates to value of theta() during inference
+            return dist.Normal(mean, 1.0)
+
+
+    Args:
+        f: A function that returns a PyTorch Distribution object
+    """
+
+    @wraps(f)
+    def wrapper(*args):
+        rvid = RVIdentifier(wrapper, args)
+        # Bean Machine inference methods use the World class to store and control the
+        # state of inference
+        world = get_world_context()
+        if world is None:
+            # We're not in an active inference. Return an ID for the random variable
+            return rvid
+        else:
+            # Update the graph and return current value of the random variable in world
+            return world.update_graph(rvid)
+
+    return wrapper
+
+
+RVDict = Dict[RVIdentifier, torch.Tensor]  # alias for typing
+WORLD_STACK: List[World] = []
+
+
+def get_world_context() -> Optional[World]:
+    """Returns the active World (if any) or None"""
+    return WORLD_STACK[-1] if WORLD_STACK else None
+
+
+class World:
+    """
+    A World is Bean Machine's internal representation of a state of the model. At the
+    high level, it stores a value for each of the random variables. It can also be used
+    as a context manager to control the behavior of random variables. For example::
+
+        @random_variable
+        def foo():
+            return dist.Normal(0., 1.0)
+
+        @random_variable
+        def bar():
+            return dist.Normal(foo(), 1.0)
+
+        # initialize world and add bar() and its ancesters to it
+        world = World.initialize_world([bar()])
+        world[bar()]  # returns the value of bar() in world
+        world[foo()]  # since foo() is bar()'s parent, it is also initialized in world
+
+        # World is also used within inference as a context manager to control the
+        # behavior of random variable
+        with world:
+            foo()  # returns the value of foo() in world, which equals to world[foo()]
+    """
+
+    def __init__(self, observations: Optional[RVDict] = None):
+        self.observations: RVDict = observations or {}
+        self.variables: RVDict = {}
+
+    def __getitem__(self, node: RVIdentifier) -> torch.Tensor:
+        return self.variables[node]
+
+    def __enter__(self) -> World:
+        WORLD_STACK.append(self)
+        return self
+
+    def __exit__(self, *args) -> None:
+        WORLD_STACK.pop()
+
+    def update_graph(self, node: RVIdentifier) -> torch.Tensor:
+        """Update the graphy by adding node to self (if needed) and retuurn the value
+        of node in self."""
+        if node not in self.variables:
+            # parent nodes will be invoked when calling node.get_distribution
+            distribution = self.get_distribution(node)
+            if node in self.observations:
+                self.variables[node] = self.observations[node]
+            else:
+                self.variables[node] = distribution.sample()
+        return self.variables[node]
+
+    def replace(self, values: RVDict) -> World:
+        """Return a new world where the values of the random variables are replaced by
+        the provided values"""
+        new_world = World(self.observations)
+        new_world.variables = {**self.variables, **values}
+        return new_world
+
+    def log_prob(self) -> torch.Tensor:
+        """Return the joint log prob on all random variables in the world"""
+        log_prob = torch.tensor(0.0)
+        for node, value in self.variables.items():
+            distribution = self.get_distribution(node)
+            log_prob += distribution.log_prob(value).sum()
+        return log_prob
+
+    def get_distribution(self, node: RVIdentifier) -> dist.Distribution:
+        """A utility method that activate the current world and invoke the function
+        associated with node. Bean Machine requires random variable functions to return
+        a distribution object, so this method will also return a distribution object."""
+        with self:
+            return node.function(*node.args)
+
+    @staticmethod
+    def initialize_world(
+        queries: List[RVIdentifier], observations: Optional[RVDict] = None
+    ) -> World:
+        """Initializes and returns a new world. Starting from the queries and
+        observations, the parent nodes will be added recursively to the world."""
+        observations = observations or {}
+        world = World(observations)
+        for node in itertools.chain(queries, observations):
+            world.update_graph(node)
+        return world
+
+
+class MetropolisHastings:
+    """A naive implementation of the `Metropolis-Hastings algorithm
+    <https://en.wikipedia.org/wiki/Metropolis%E2%80%93Hastings_algorithm>`_"""
+
+    def infer(
+        self,
+        queries: List[RVIdentifier],
+        observations: Optional[RVDict],
+        num_samples: int,
+    ) -> RVDict:
+        world = World.initialize_world(queries, observations)
+
+        samples = defaultdict(list)
+        # the main inference loop
+        for _ in tqdm(range(num_samples)):
+            latent_nodes = world.variables.keys() - world.observations.keys()
+            random.shuffle(latent_nodes)
+            # randomly select a node to be updated at a time
+            for node in latent_nodes:
+                proposer_distribution = world.get_distribution(node)
+                new_value = proposer_distribution.sample()
+                new_world = world.replace({node: new_value})
+                backward_distribution = new_world.get_distribution(node)
+
+                # log P(x, y)
+                old_log_prob = world.log_prob()
+                # log P(x', y)
+                new_log_prob = new_world.log_prob()
+                # log g(x'|x)
+                forward_log_prob = proposer_distribution.log_prob(new_value).sum()
+                # log g(x|x')
+                backward_log_prob = backward_distribution.log_prob(world[node]).sum()
+
+                accept_log_prob = (
+                    new_log_prob + backward_log_prob - old_log_prob - forward_log_prob
+                )
+                if torch.bernoulli(accept_log_prob.exp().clamp(max=1)):
+                    # accept the new state
+                    world = new_world
+
+            # collect the samples before moving to the next iteration
+            for node in queries:
+                samples[node].append(world[node])
+        # stack the list of tensors into a single tensor
+        samples = {node: torch.stack(samples[node]) for node in samples}
+        return samples
+
+
+def main():
+    # coin fliping model adapted from our tutorial
+    # (https://beanmachine.org/docs/overview/tutorials/Coin_flipping/CoinFlipping/)
+    @random_variable
+    def weight():
+        return dist.Beta(2, 2)
+
+    @random_variable
+    def y():
+        return dist.Bernoulli(weight()).expand((N,))
+
+    # data generation
+    true_weight = 0.75
+    true_y = dist.Bernoulli(true_weight)
+    N = 100
+    y_obs = true_y.sample((N,))
+
+    print("Head rate:", y_obs.mean())
+
+    # running inference
+    samples = MetropolisHastings().infer([weight()], {y(): y_obs}, num_samples=500)
+    print("Estimated weight of the coin:", samples[weight()].mean())
+
+
+if __name__ == "__main__":
+    main()
diff --git a/website/Makefile b/website/Makefile
index b73a7df14e..ffd9d4fa8e 100644
--- a/website/Makefile
+++ b/website/Makefile
@@ -6,7 +6,7 @@ SPHINXOPTS    ?=
 SPHINXBUILD   ?= sphinx-build
 SOURCEDIR     = ./sphinx
 MODULEDIR     = ../src/beanmachine
-MODULEIGNOREDIRS     = ../src/beanmachine/{applications,graph,tutorials}* ../src/beanmachine/ppl/{conftest.py,diagnostics,examples,experimental,inference/utils,legacy,testlib,utils}
+MODULEIGNOREDIRS     = ../src/beanmachine/{applications,graph,minibm,tutorials}* ../src/beanmachine/ppl/{conftest.py,diagnostics,examples,experimental,inference/utils,legacy,testlib,utils}
 BUILDDIR      = ./static
 ALLSPHINXOPTS = -d $(BUILDDIR)/doctrees $(SPHINXOPTS) $(SOURCEDIR)