diff --git a/experiments/mapper.cpp b/experiments/mapper.cpp
new file mode 100644
index 000000000..3a59d4d07
--- /dev/null
+++ b/experiments/mapper.cpp
@@ -0,0 +1,110 @@
+/* mockturtle: C++ logic network library
+ * Copyright (C) 2018-2021  EPFL
+ *
+ * Permission is hereby granted, free of charge, to any person
+ * obtaining a copy of this software and associated documentation
+ * files (the "Software"), to deal in the Software without
+ * restriction, including without limitation the rights to use,
+ * copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following
+ * conditions:
+ *
+ * The above copyright notice and this permission notice shall be
+ * included in all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+ * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
+ * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+ * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
+ * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
+ * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+ * OTHER DEALINGS IN THE SOFTWARE.
+ */
+
+#include <string>
+#include <vector>
+
+#include <fmt/format.h>
+#include <lorina/aiger.hpp>
+#include <lorina/genlib.hpp>
+#include <mockturtle/utils/tech_library.hpp>
+#include <mockturtle/algorithms/mapper.hpp>
+#include <mockturtle/algorithms/node_resynthesis.hpp>
+#include <mockturtle/algorithms/node_resynthesis/mig_npn.hpp>
+#include <mockturtle/io/aiger_reader.hpp>
+#include <mockturtle/io/genlib_reader.hpp>
+#include <mockturtle/networks/aig.hpp>
+#include <mockturtle/networks/klut.hpp>
+#include <mockturtle/views/depth_view.hpp>
+
+
+#include <experiments.hpp>
+
+/* Gate library embedded as text; `main` feeds it to `lorina::read_genlib`.
+ *
+ * One gate per line: inverters of four sizes, NAND/NOR with two to four
+ * inputs, AND2/OR2, XOR2/XNOR2, AOI/OAI, a buffer and the two constants.
+ * The lines starting with `#` (xor2b, xnor2b) are presumably skipped by the
+ * reader as comments -- TODO confirm against the genlib parser.
+ */
+std::string const mcnc_library =  "GATE   inv1    1 O=!a;           PIN * INV 1 999 0.9 0.3 0.9 0.3\n"
+                                  "GATE   inv2    2 O=!a;           PIN * INV 2 999 1.0 0.1 1.0 0.1\n"
+                                  "GATE   inv3    3 O=!a;           PIN * INV 3 999 1.1 0.09 1.1 0.09\n"
+                                  "GATE   inv4    4 O=!a;           PIN * INV 4 999 1.2 0.07 1.2 0.07\n"
+                                  "GATE   nand2   2 O=!(ab);        PIN * INV 1 999 1.0 0.2 1.0 0.2\n"
+                                  "GATE   nand3   3 O=!(abc);	      PIN * INV 1 999 1.1 0.3 1.1 0.3\n"
+                                  "GATE   nand4   4 O=!(abcd);      PIN * INV 1 999 1.4 0.4 1.4 0.4\n"
+                                  "GATE   nor2    2 O=!{ab};        PIN * INV 1 999 1.4 0.5 1.4 0.5\n"
+                                  "GATE   nor3    3 O=!{abc};       PIN * INV 1 999 2.4 0.7 2.4 0.7\n"
+                                  "GATE   nor4    4 O=!{abcd};      PIN * INV 1 999 3.8 1.0 3.8 1.0\n"
+                                  "GATE   and2    3 O=(ab);         PIN * NONINV 1 999 1.9 0.3 1.9 0.3\n"
+                                  "GATE   or2     3 O={ab};         PIN * NONINV 1 999 2.4 0.3 2.4 0.3\n"
+                                  "GATE   xor2a   5 O=[ab];         PIN * UNKNOWN 2 999 1.9 0.5 1.9 0.5\n"
+                                  "#GATE  xor2b   5 O=[ab];         PIN * UNKNOWN 2 999 1.9 0.5 1.9 0.5\n"
+                                  "GATE   xnor2a  5 O=![ab];        PIN * UNKNOWN 2 999 2.1 0.5 2.1 0.5\n"
+                                  "#GATE  xnor2b  5 O=![ab];        PIN * UNKNOWN 2 999 2.1 0.5 2.1 0.5\n"
+                                  "GATE   aoi21   3 O=!{(ab)c};     PIN * INV 1 999 1.6 0.4 1.6 0.4\n"
+                                  "GATE   aoi22   4 O=!{(ab)(cd)};  PIN * INV 1 999 2.0 0.4 2.0 0.4\n"
+                                  "GATE   oai21   3 O=!({ab}c);     PIN * INV 1 999 1.6 0.4 1.6 0.4\n"
+                                  "GATE   oai22   4 O=!({ab}{cd});  PIN * INV 1 999 2.0 0.4 2.0 0.4\n"
+                                  "GATE   buf     2 O=a;            PIN * NONINV 1 999 1.0 0.0 1.0 0.0\n"
+                                  "GATE   zero    0 O=0;\n"
+                                  "GATE   one     0 O=1;";
+
+/* Maps every EPFL benchmark onto the embedded gate library with `tech_map`
+ * and records size, area, depth, delay, runtime and the equivalence-check
+ * result in the "mapper" experiment table.
+ *
+ * Returns 1 if the gate library cannot be parsed and 0 otherwise. A
+ * benchmark whose AIGER file cannot be read is skipped.
+ */
+int main()
+{
+  using namespace experiments;
+  using namespace mockturtle;
+
+  experiment<std::string, uint32_t, double, uint32_t, float, float, bool> exp( "mapper", "benchmark", "size", "area_after", "depth", "delay_after", "runtime", "equivalent" );
+
+  fmt::print( "[i] processing technology library\n" );
+
+  std::vector<gate> gates;
+
+  std::istringstream in( mcnc_library );
+
+  /* without a gate library there is nothing to map onto */
+  if ( lorina::read_genlib( in, genlib_reader( gates ) ) != lorina::return_code::success )
+  {
+    fmt::print( "[e] could not parse the technology library\n" );
+    return 1;
+  }
+
+  tech_library_params tps;
+  tech_library<5> lib( gates, tps );
+
+  for ( auto const& benchmark : epfl_benchmarks() )
+  {
+    fmt::print( "[i] processing {}\n", benchmark );
+    aig_network aig;
+
+    /* do not map (and report on) a network that was not read correctly */
+    if ( lorina::read_aiger( benchmark_path( benchmark ), aiger_reader( aig ) ) != lorina::return_code::success )
+    {
+      fmt::print( "[e] could not read benchmark {}\n", benchmark );
+      continue;
+    }
+
+    const uint32_t size_before = aig.num_gates();
+    const uint32_t depth_before = depth_view( aig ).depth();
+
+    /* the cut size matches the number of inputs of `tech_library<5>` */
+    map_params ps;
+    ps.cut_enumeration_ps.cut_size = 5;
+    map_stats st;
+
+    auto res = tech_map( aig, lib, ps, &st );
+
+    /* equivalence checking is skipped for "hyp" and reported as true */
+    const auto cec = benchmark == "hyp" ? true : abc_cec( res, benchmark );
+
+    exp( benchmark, size_before, st.area, depth_before, st.delay, to_seconds( st.time_total ), cec );
+  }
+
+  exp.save();
+  exp.table();
+
+  return 0;
+}
diff --git a/include/mockturtle/algorithms/cut_enumeration/exact_map_cut.hpp b/include/mockturtle/algorithms/cut_enumeration/exact_map_cut.hpp
new file mode 100644
index 000000000..18bdc3c82
--- /dev/null
+++ b/include/mockturtle/algorithms/cut_enumeration/exact_map_cut.hpp
@@ -0,0 +1,103 @@
+/* mockturtle: C++ logic network library
+ * Copyright (C) 2018-2021  EPFL
+ *
+ * Permission is hereby granted, free of charge, to any person
+ * obtaining a copy of this software and associated documentation
+ * files (the "Software"), to deal in the Software without
+ * restriction, including without limitation the rights to use,
+ * copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following
+ * conditions:
+ *
+ * The above copyright notice and this permission notice shall be
+ * included in all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+ * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
+ * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+ * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
+ * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
+ * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+ * OTHER DEALINGS IN THE SOFTWARE.
+ */
+
+/*!
+  \file exact_map_cut.hpp
+  \brief Cut enumeration for mapping with exact synthesis
+
+  \author Alessandro Tempia Calvino
+*/
+
+#pragma once
+
+#include <algorithm>
+#include <cstdint>
+#include <iomanip>
+#include <iostream>
+#include <vector>
+
+#include "../cut_enumeration.hpp"
+
+namespace mockturtle
+{
+
+/*! \brief Cut implementation based on ABC's giaMf.c
+
+  See <a href="https://github.com/berkeley-abc/abc/blob/master/src/aig/gia/giaMf.c">giaMf.c</a> in ABC's repository.
+
+  `delay` and `flow` are computed by the matching
+  `cut_enumeration_update_cut` specialization; `match_index` and `ignore`
+  are not touched there and are left for the user of the cuts to fill in.
+*/
+struct cut_enumeration_exact_map_cut
+{
+  /* one plus the largest delay among the best cuts of the leaves */
+  uint32_t delay = 0u;
+  /* area-flow estimate of the cut */
+  float flow = 0.0f;
+  /* index of the match associated with this cut */
+  uint8_t match_index = 0u;
+  /* set when the cut must be skipped */
+  bool ignore = false;
+};
+
+/*! \brief Orders cuts by flow, then by delay, then by number of leaves.
+ *
+ * Two flows that differ by no more than `eps` are considered equal, in
+ * which case the delay (and finally the cut size) decides.
+ */
+template<bool ComputeTruth>
+bool operator<( cut_type<ComputeTruth, cut_enumeration_exact_map_cut> const& c1, cut_type<ComputeTruth, cut_enumeration_exact_map_cut> const& c2 )
+{
+  constexpr auto eps{ 0.005f };
+  auto const& lhs = c1->data;
+  auto const& rhs = c2->data;
+
+  if ( lhs.flow < rhs.flow - eps )
+  {
+    return true;
+  }
+  if ( lhs.flow > rhs.flow + eps )
+  {
+    return false;
+  }
+  if ( lhs.delay != rhs.delay )
+  {
+    return lhs.delay < rhs.delay;
+  }
+  return c1.size() < c2.size();
+}
+
+/*! \brief Computes delay and flow of a `cut_enumeration_exact_map_cut`.
+ *
+ * The delay is one more than the largest delay of the first (best) cut of
+ * any leaf. The flow is one plus the flows of the first cuts of the leaves,
+ * divided by the fanout size of the root node `n`.
+ */
+template<>
+struct cut_enumeration_update_cut<cut_enumeration_exact_map_cut>
+{
+  template<typename Cut, typename NetworkCuts, typename Ntk>
+  static void apply( Cut& cut, NetworkCuts const& cuts, Ntk const& ntk, node<Ntk> const& n )
+  {
+    uint32_t worst_leaf_delay = 0u;
+    float flow_sum = 1.0f;
+
+    for ( auto const leaf : cut )
+    {
+      /* the first cut in a node's cut set is its current best cut */
+      auto const& leaf_cut = cuts.cuts( leaf )[0];
+      if ( worst_leaf_delay < leaf_cut->data.delay )
+      {
+        worst_leaf_delay = leaf_cut->data.delay;
+      }
+      flow_sum += leaf_cut->data.flow;
+    }
+
+    cut->data.delay = worst_leaf_delay + 1;
+    cut->data.flow = flow_sum / ntk.fanout_size( n );
+  }
+};
+
+/*! \brief Prints the leaves of a cut followed by its delay (D) and flow (A).
+ *
+ * The leaves are written with a plain loop so that this header does not
+ * rely on `<iterator>` (for `std::ostream_iterator`) being included
+ * transitively.
+ */
+template<int MaxLeaves>
+std::ostream& operator<<( std::ostream& os, cut<MaxLeaves, cut_data<false, cut_enumeration_exact_map_cut>> const& c )
+{
+  os << "{ ";
+  for ( uint32_t const leaf : c )
+  {
+    os << leaf << " ";
+  }
+  os << "}, D = " << std::setw( 3 ) << c->data.delay << " A = " << c->data.flow;
+  return os;
+}
+
+} // namespace mockturtle
diff --git a/include/mockturtle/algorithms/cut_enumeration/tech_map_cut.hpp b/include/mockturtle/algorithms/cut_enumeration/tech_map_cut.hpp
new file mode 100644
index 000000000..6c84013e8
--- /dev/null
+++ b/include/mockturtle/algorithms/cut_enumeration/tech_map_cut.hpp
@@ -0,0 +1,99 @@
+/* mockturtle: C++ logic network library
+ * Copyright (C) 2018-2021  EPFL
+ *
+ * Permission is hereby granted, free of charge, to any person
+ * obtaining a copy of this software and associated documentation
+ * files (the "Software"), to deal in the Software without
+ * restriction, including without limitation the rights to use,
+ * copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following
+ * conditions:
+ *
+ * The above copyright notice and this permission notice shall be
+ * included in all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+ * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
+ * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+ * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
+ * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
+ * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+ * OTHER DEALINGS IN THE SOFTWARE.
+ */
+
+/*!
+  \file tech_map_cut.hpp
+  \brief Cut enumeration for technology mapping
+
+  \author Alessandro Tempia Calvino
+*/
+
+#pragma once
+
+#include <algorithm>
+#include <cstdint>
+#include <iomanip>
+#include <iostream>
+#include <vector>
+
+#include "../cut_enumeration.hpp"
+
+namespace mockturtle
+{
+
+/*! \brief Cut data for technology mapping.
+ *
+ * `delay` and `flow` are computed by the matching
+ * `cut_enumeration_update_cut` specialization; `match_index` and `ignore`
+ * are not touched there and are left for the user of the cuts to fill in.
+ */
+struct cut_enumeration_tech_map_cut
+{
+  /* one plus the largest delay among the best cuts of the leaves */
+  uint32_t delay = 0u;
+  /* area-flow estimate of the cut */
+  float flow = 0.0f;
+  /* index of the match associated with this cut */
+  uint8_t match_index = 0u;
+  /* set when the cut must be skipped */
+  bool ignore = false;
+};
+
+/*! \brief Orders cuts by number of leaves, then by delay, then by flow.
+ *
+ * On equal size and delay, `c1` precedes `c2` only if its flow is smaller
+ * by more than `eps`.
+ */
+template<bool ComputeTruth>
+bool operator<( cut_type<ComputeTruth, cut_enumeration_tech_map_cut> const& c1, cut_type<ComputeTruth, cut_enumeration_tech_map_cut> const& c2 )
+{
+  constexpr auto eps{ 0.005f };
+
+  if ( c1.size() != c2.size() )
+  {
+    return c1.size() < c2.size();
+  }
+
+  auto const& lhs = c1->data;
+  auto const& rhs = c2->data;
+  if ( lhs.delay != rhs.delay )
+  {
+    return lhs.delay < rhs.delay;
+  }
+  return lhs.flow < rhs.flow - eps;
+}
+
+/*! \brief Computes delay and flow of a `cut_enumeration_tech_map_cut`.
+ *
+ * The delay is one more than the largest delay of the first (best) cut of
+ * any leaf. The flow is one plus the flows of the first cuts of the leaves,
+ * divided by the fanout size of the root node `n`.
+ */
+template<>
+struct cut_enumeration_update_cut<cut_enumeration_tech_map_cut>
+{
+  template<typename Cut, typename NetworkCuts, typename Ntk>
+  static void apply( Cut& cut, NetworkCuts const& cuts, Ntk const& ntk, node<Ntk> const& n )
+  {
+    uint32_t worst_leaf_delay = 0u;
+    float flow_sum = 1.0f;
+
+    for ( auto const leaf : cut )
+    {
+      /* the first cut in a node's cut set is its current best cut */
+      auto const& leaf_cut = cuts.cuts( leaf )[0];
+      if ( worst_leaf_delay < leaf_cut->data.delay )
+      {
+        worst_leaf_delay = leaf_cut->data.delay;
+      }
+      flow_sum += leaf_cut->data.flow;
+    }
+
+    cut->data.delay = worst_leaf_delay + 1;
+    cut->data.flow = flow_sum / ntk.fanout_size( n );
+  }
+};
+
+/*! \brief Prints the leaves of a cut followed by its delay (D) and flow (A).
+ *
+ * The leaves are written with a plain loop so that this header does not
+ * rely on `<iterator>` (for `std::ostream_iterator`) being included
+ * transitively.
+ */
+template<int MaxLeaves>
+std::ostream& operator<<( std::ostream& os, cut<MaxLeaves, cut_data<false, cut_enumeration_tech_map_cut>> const& c )
+{
+  os << "{ ";
+  for ( uint32_t const leaf : c )
+  {
+    os << leaf << " ";
+  }
+  os << "}, D = " << std::setw( 3 ) << c->data.delay << " A = " << c->data.flow;
+  return os;
+}
+
+} // namespace mockturtle
diff --git a/include/mockturtle/algorithms/mapper.hpp b/include/mockturtle/algorithms/mapper.hpp
new file mode 100644
index 000000000..5a464d31e
--- /dev/null
+++ b/include/mockturtle/algorithms/mapper.hpp
@@ -0,0 +1,2655 @@
+/* mockturtle: C++ logic network library
+ * Copyright (C) 2018-2021  EPFL
+ *
+ * Permission is hereby granted, free of charge, to any person
+ * obtaining a copy of this software and associated documentation
+ * files (the "Software"), to deal in the Software without
+ * restriction, including without limitation the rights to use,
+ * copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following
+ * conditions:
+ *
+ * The above copyright notice and this permission notice shall be
+ * included in all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+ * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
+ * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+ * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
+ * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
+ * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+ * OTHER DEALINGS IN THE SOFTWARE.
+ */
+
+/*!
+  \file mapper.hpp
+  \brief Mapper
+
+  \author Alessandro Tempia Calvino
+*/
+
+#pragma once
+
+#include <cstdint>
+#include <limits>
+
+#include <fmt/format.h>
+
+#include "../networks/klut.hpp"
+#include "../utils/node_map.hpp"
+#include "../utils/stopwatch.hpp"
+#include "../utils/tech_library.hpp"
+#include "../views/topo_view.hpp"
+#include "cut_enumeration.hpp"
+#include "cut_enumeration/exact_map_cut.hpp"
+#include "cut_enumeration/tech_map_cut.hpp"
+
+namespace mockturtle
+{
+
+/*! \brief Parameters for the mapper.
+ *
+ * The data structure `map_params` holds configurable parameters
+ * with default arguments for the mapper.
+ */
+struct map_params
+{
+  map_params()
+  {
+    cut_enumeration_ps.cut_size = 4;
+    cut_enumeration_ps.cut_limit = 25;
+    cut_enumeration_ps.minimize_truth_table = true;
+  }
+
+  /*! \brief Parameters for cut enumeration
+   *
+   * The constructor sets the cut size to 4 and the cut limit to 25, and
+   * enables truth table minimization.
+   */
+  cut_enumeration_params cut_enumeration_ps{};
+
+  /*! \brief Required time for delay optimization.
+   *
+   * A value of 0 means that no target is given; the delay of the current
+   * mapping is then used as required time.
+   */
+  double required_time{ 0.0 };
+
+  /*! \brief Skip the delay-oriented mapping round. */
+  bool skip_delay_round{ false };
+
+  /*! \brief Number of rounds for area flow optimization. */
+  uint32_t area_flow_rounds{ 1u };
+
+  /*! \brief Number of rounds for exact area optimization. */
+  uint32_t ela_rounds{ 2u };
+
+  /*! \brief Use structural choices. */
+  bool choices{ false };
+
+  /*! \brief Be verbose. */
+  bool verbose{ false };
+};
+
+/*! \brief Statistics for the mapper.
+ *
+ * The data structure `map_stats` provides data collected by running
+ * the mapper.
+ */
+struct map_stats
+{
+  /*! \brief Area result. */
+  double area = 0.0;
+  /*! \brief Delay result. */
+  double delay = 0.0;
+
+  /*! \brief Runtime of the mapping itself. */
+  stopwatch<>::duration time_mapping{ 0 };
+  /*! \brief Total runtime. */
+  stopwatch<>::duration time_total{ 0 };
+
+  /*! \brief Cut enumeration stats. */
+  cut_enumeration_stats cut_enumeration_st{};
+
+  /*! \brief Delay and area stats for each round (one formatted line per round). */
+  std::vector<std::string> round_stats{};
+
+  /*! \brief Gates usage stats. */
+  std::string gates_usage{};
+
+  /*! \brief Mapping error. */
+  bool mapping_error = false;
+
+  /*! \brief Prints the per-round lines, the final area/delay, the runtimes
+   *  and, if available, the gates usage report to `std::cout`.
+   */
+  void report() const
+  {
+    for ( auto const& round_line : round_stats )
+    {
+      std::cout << round_line;
+    }
+
+    std::cout << fmt::format( "[i] Area = {:>5.2f}; Delay = {:>5.2f}\n", area, delay );
+    std::cout << fmt::format( "[i] Mapping runtime = {:>5.2f} secs\n", to_seconds( time_mapping ) );
+    std::cout << fmt::format( "[i] Total runtime   = {:>5.2f} secs\n", to_seconds( time_total ) );
+
+    if ( gates_usage.empty() )
+    {
+      return;
+    }
+    std::cout << "[i] Gates usage report:\n"
+              << gates_usage;
+  }
+};
+
+namespace detail
+{
+
+/* Per-node mapping data of the technology mapper.
+ *
+ * Index 0 of the two-element arrays refers to the positive output phase and
+ * index 1 to the negative one. Every member has an initializer so that a
+ * default-initialized object never holds indeterminate values.
+ */
+template<unsigned NInputs>
+struct node_match_tech
+{
+  /* best gate match for positive and negative output phases */
+  supergate<NInputs> const* best_supergate[2] = { nullptr, nullptr };
+  /* fanin pin phases for both output phases */
+  uint8_t phase[2] = { 0u, 0u };
+  /* best cut index for both phases */
+  uint32_t best_cut[2] = { 0u, 0u };
+  /* node is mapped using only one phase */
+  bool same_match{ false };
+
+  /* arrival time at node output */
+  double arrival[2] = { 0.0, 0.0 };
+  /* required time at node output */
+  double required[2] = { 0.0, 0.0 };
+  /* area of the best matches */
+  float area[2] = { 0.0f, 0.0f };
+
+  /* number of references in the cover 0: pos, 1: neg, 2: pos+neg */
+  uint32_t map_refs[3] = { 0u, 0u, 0u };
+  /* references estimation */
+  float est_refs[3] = { 0.0f, 0.0f, 0.0f };
+  /* area flow */
+  float flows[3] = { 0.0f, 0.0f, 0.0f };
+};
+
+template<class Ntk, unsigned NInputs, typename CutData>
+class tech_map_impl
+{
+public:
+  using network_cuts_t = network_cuts<Ntk, true, CutData>;
+  using cut_t = typename network_cuts_t::cut_t;
+  using supergate_t = std::array<std::vector<supergate<NInputs>> const*, 2>;
+  using klut_map = std::unordered_map<uint32_t, std::array<signal<klut_network>, 2>>;
+
+public:
+  /* Stores the references to network, library, parameters and statistics,
+   * allocates one match record per node and enumerates the cuts right away
+   * (cut enumeration therefore runs in the constructor, not in `run`).
+   * Finally caches area, delay and id of the library inverter.
+   */
+  tech_map_impl( Ntk const& ntk, tech_library<NInputs> const& library, map_params const& ps, map_stats& st )
+      : ntk( ntk ),
+        library( library ),
+        ps( ps ),
+        st( st ),
+        node_match( ntk.size() ),
+        matches(),
+        cuts( cut_enumeration<Ntk, true, CutData>( ntk, ps.cut_enumeration_ps, &st.cut_enumeration_st ) )
+  {
+    auto const [inv_area, inv_delay, inv_id] = library.get_inverter_info();
+    lib_inv_area = inv_area;
+    lib_inv_delay = inv_delay;
+    lib_inv_id = inv_id;
+  }
+
+  /* Runs the complete mapping flow and returns the mapped k-LUT network.
+   *
+   * The flow is: an optional delay round, then area-flow rounds, then
+   * exact-area rounds; `iteration` is advanced by each successful round.
+   * If any round fails, the network created by `initialize_map_network` is
+   * returned as is, without the cover being generated.
+   */
+  klut_network run()
+  {
+    stopwatch t( st.time_mapping );
+
+    auto [res, old2new] = initialize_map_network();
+
+    /* cache the topological order, it is reused by every round */
+    top_order.reserve( ntk.size() );
+    topo_view<Ntk>( ntk ).foreach_node( [this]( auto v ) {
+      top_order.push_back( v );
+    } );
+
+    /* match the cuts against the library, then set up the node data */
+    compute_matches();
+    init_nodes();
+
+    /* delay-oriented round */
+    if ( !ps.skip_delay_round && !compute_mapping<false>() )
+    {
+      return res;
+    }
+
+    /* global area flow rounds */
+    const auto area_flow_end = ps.area_flow_rounds + 1;
+    while ( iteration < area_flow_end )
+    {
+      compute_required_time();
+      if ( !compute_mapping<true>() )
+      {
+        return res;
+      }
+    }
+
+    /* exact area rounds */
+    const auto exact_area_end = ps.ela_rounds + ps.area_flow_rounds + 1;
+    while ( iteration < exact_area_end )
+    {
+      compute_required_time();
+      if ( !compute_mapping_exact_area() )
+      {
+        return res;
+      }
+    }
+
+    /* build the output network from the selected cover */
+    finalize_cover( res, old2new );
+
+    return res;
+  }
+
+private:
+  /* Initializes the per-node data before the first mapping round.
+   *
+   * Every node starts with its fanout size as reference estimate.
+   * Constants and PIs additionally get zero flow and arrival time; the
+   * negative phase of a PI arrives after one inverter delay. Constants are
+   * also matched via `match_constants`.
+   */
+  void init_nodes()
+  {
+    ntk.foreach_node( [this]( auto const& n, auto ) {
+      const auto index = ntk.node_to_index( n );
+      auto& node_data = node_match[index];
+
+      const auto fanouts = static_cast<float>( ntk.fanout_size( n ) );
+      node_data.est_refs[0] = fanouts;
+      node_data.est_refs[1] = fanouts;
+      node_data.est_refs[2] = fanouts;
+
+      const bool is_const = ntk.is_constant( n );
+      if ( !is_const && !ntk.is_pi( n ) )
+      {
+        /* gates get flows and arrival times during matching */
+        return;
+      }
+
+      /* all terminals have flow 0 and their positive phase arrives at time 0 */
+      node_data.flows[0] = 0.0f;
+      node_data.flows[1] = 0.0f;
+      node_data.flows[2] = 0.0f;
+      node_data.arrival[0] = 0.0f;
+
+      if ( is_const )
+      {
+        node_data.arrival[1] = 0.0f;
+        match_constants( index );
+      }
+      else
+      {
+        /* PIs have the negative phase implemented with an inverter */
+        node_data.arrival[1] = lib_inv_delay;
+      }
+    } );
+  }
+
+  /* Matches the cuts of every gate against the technology library.
+   *
+   * For each cut the supergates implementing its function and the
+   * complemented function are looked up. Matched cuts get a `match_index`
+   * into the node's entry of `matches`; the unit cut, cuts with more than
+   * `NInputs` leaves and cuts without any match are flagged as `ignore`.
+   */
+  void compute_matches()
+  {
+    ntk.foreach_gate( [&]( auto const& n ) {
+      const auto index = ntk.node_to_index( n );
+
+      /* fill the node's match list in place; building a local vector and
+       * assigning it afterwards would copy every entry once more */
+      auto& node_matches = matches[index];
+      node_matches.clear();
+
+      auto i = 0u;
+      for ( auto& cut : cuts.cuts( index ) )
+      {
+        /* ignore unit cut */
+        if ( cut->size() == 1 && *cut->begin() == index )
+        {
+          ( *cut )->data.ignore = true;
+          continue;
+        }
+        /* ignore cuts too big to be mapped using the library */
+        if ( cut->size() > NInputs )
+        {
+          ( *cut )->data.ignore = true;
+          continue;
+        }
+
+        const auto tt = cuts.truth_table( *cut );
+        const auto fe = kitty::extend_to<NInputs>( tt );
+        auto const supergates_pos = library.get_supergates( fe );
+        auto const supergates_neg = library.get_supergates( ~fe );
+
+        /* ignore not matched cuts */
+        if ( supergates_pos == nullptr && supergates_neg == nullptr )
+        {
+          ( *cut )->data.ignore = true;
+          continue;
+        }
+
+        node_matches.push_back( supergate_t{ supergates_pos, supergates_neg } );
+        ( *cut )->data.match_index = i++;
+      }
+    } );
+  }
+
+  /* Performs one mapping round over all gates in topological order.
+   *
+   * `DO_AREA` is forwarded to `match_phase` and `match_drop_phase` and
+   * selects the label of the round in the statistics ("AreaFlow" vs
+   * "Delay"). Afterwards the mapping references, delay and area are
+   * recomputed with `set_mapping_refs<false>`, whose result is returned.
+   */
+  template<bool DO_AREA>
+  bool compute_mapping()
+  {
+    for ( auto const& n : top_order )
+    {
+      if ( ntk.is_constant( n ) || ntk.is_pi( n ) )
+      {
+        continue;
+      }
+
+      /* match positive phase */
+      match_phase<DO_AREA>( n, 0u );
+
+      /* match negative phase */
+      match_phase<DO_AREA>( n, 1u );
+
+      /* try to drop one phase */
+      match_drop_phase<DO_AREA, false>( n, 0 );
+    }
+
+    double area_old = area;
+    bool success = set_mapping_refs<false>();
+
+    /* round stats */
+    if ( ps.verbose )
+    {
+      /* `set_mapping_refs` has already advanced `iteration`, so 1 denotes
+       * the first round, which has nothing to compare against; a previous
+       * area of zero would make the ratio undefined */
+      float area_gain = 0.0f;
+      if ( iteration != 1 && area_old != 0.0 )
+      {
+        area_gain = float( ( area_old - area ) / area_old * 100 );
+      }
+
+      if constexpr ( DO_AREA )
+      {
+        st.round_stats.push_back( fmt::format( "[i] AreaFlow : Delay = {:>12.2f}  Area = {:>12.2f}  {:>5.2f} %\n", delay, area, area_gain ) );
+      }
+      else
+      {
+        st.round_stats.push_back( fmt::format( "[i] Delay    : Delay = {:>12.2f}  Area = {:>12.2f}  {:>5.2f} %\n", delay, area, area_gain ) );
+      }
+    }
+
+    return success;
+  }
+
+  /* Performs one exact-area mapping round over all gates in topological
+   * order.
+   *
+   * Before a node is re-matched, a match shared by both phases that is in
+   * use in the cover is dereferenced. Afterwards delay and area are
+   * recomputed with `set_mapping_refs<true>`, whose result is returned.
+   */
+  bool compute_mapping_exact_area()
+  {
+    for ( auto const& n : top_order )
+    {
+      if ( ntk.is_constant( n ) || ntk.is_pi( n ) )
+        continue;
+
+      auto index = ntk.node_to_index( n );
+      auto& node_data = node_match[index];
+
+      /* recursively deselect the best cut shared between
+       * the two phases if in use in the cover */
+      if ( node_data.same_match && node_data.map_refs[2] != 0 )
+      {
+        if ( node_data.best_supergate[0] != nullptr )
+          cut_deref( cuts.cuts( index )[node_data.best_cut[0]], n, 0u );
+        else
+          cut_deref( cuts.cuts( index )[node_data.best_cut[1]], n, 1u );
+      }
+
+      /* match positive phase */
+      match_phase_exact( n, 0u );
+
+      /* match negative phase */
+      match_phase_exact( n, 1u );
+
+      /* try to drop one phase */
+      match_drop_phase<true, true>( n, 0 );
+    }
+
+    double area_old = area;
+    bool success = set_mapping_refs<true>();
+
+    /* round stats */
+    if ( ps.verbose )
+    {
+      /* a previous area of zero (e.g. when this is the very first round)
+       * would make the ratio undefined; report no gain in that case */
+      float area_gain = 0.0f;
+      if ( area_old != 0.0 )
+      {
+        area_gain = float( ( area_old - area ) / area_old * 100 );
+      }
+      st.round_stats.push_back( fmt::format( "[i] Area     : Delay = {:>12.2f}  Area = {:>12.2f}  {:>5.2f} %\n", delay, area, area_gain ) );
+    }
+
+    return success;
+  }
+
+  /* Recomputes the worst delay and the area of the current cover and
+   * blends the reference estimates used by the next round.
+   *
+   * With `ELA == false` the mapping references are rebuilt from scratch:
+   * they are reset, seeded from the POs and propagated to the leaves of the
+   * selected cuts in reverse topological order. With `ELA == true` the
+   * existing references are left untouched and only delay and area are
+   * recomputed.
+   *
+   * Returns false and sets `st.mapping_error` if a referenced node has no
+   * match in the library; `iteration` is advanced only on success.
+   */
+  template<bool ELA>
+  bool set_mapping_refs()
+  {
+    const auto coef = 1.0f / ( 2.0f + ( iteration + 1 ) * ( iteration + 1 ) );
+
+    if constexpr ( !ELA )
+    {
+      for ( auto i = 0u; i < node_match.size(); ++i )
+      {
+        node_match[i].map_refs[0] = node_match[i].map_refs[1] = node_match[i].map_refs[2] = 0u;
+      }
+    }
+
+    /* compute the current worst delay and update the mapping refs */
+    delay = 0.0f;
+    ntk.foreach_po( [this]( auto s ) {
+      const auto index = ntk.node_to_index( ntk.get_node( s ) );
+
+      if ( ntk.is_complemented( s ) )
+        delay = std::max( delay, node_match[index].arrival[1] );
+      else
+        delay = std::max( delay, node_match[index].arrival[0] );
+
+      if constexpr ( !ELA )
+      {
+        node_match[index].map_refs[2]++;
+        if ( ntk.is_complemented( s ) )
+          node_match[index].map_refs[1]++;
+        else
+          node_match[index].map_refs[0]++;
+      }
+    } );
+
+    /* adds one reference to each leaf of the best cut selected for `phase`
+     * at node `index`; bit k of the stored pin phases tells which phase of
+     * the k-th leaf is used */
+    [[maybe_unused]] auto const reference_leaves = [this]( auto const index, unsigned const phase ) {
+      auto const& node_data = node_match[index];
+      auto const& best_cut = cuts.cuts( index )[node_data.best_cut[phase]];
+      auto ctr = 0u;
+
+      for ( auto const leaf : best_cut )
+      {
+        node_match[leaf].map_refs[2]++;
+        if ( ( node_data.phase[phase] >> ctr++ ) & 1 )
+          node_match[leaf].map_refs[1]++;
+        else
+          node_match[leaf].map_refs[0]++;
+      }
+    };
+
+    /* compute current area and update mapping refs in top-down order */
+    area = 0.0f;
+    for ( auto it = top_order.rbegin(); it != top_order.rend(); ++it )
+    {
+      const auto index = ntk.node_to_index( *it );
+      auto& node_data = node_match[index];
+
+      /* skip constants and PIs */
+      if ( ntk.is_constant( *it ) )
+      {
+        /* if used and not available in the library launch a mapping error */
+        if ( node_data.map_refs[2] > 0u && node_data.best_supergate[0] == nullptr && node_data.best_supergate[1] == nullptr )
+        {
+          std::cerr << "[i] MAP ERROR: technology library does not contain constant gates, impossible to perform mapping" << std::endl;
+          st.mapping_error = true;
+          return false;
+        }
+        continue;
+      }
+      else if ( ntk.is_pi( *it ) )
+      {
+        if ( node_data.map_refs[1] > 0u )
+        {
+          /* Add inverter area over the negated fanins */
+          area += lib_inv_area;
+        }
+        continue;
+      }
+
+      /* continue if not referenced in the cover */
+      if ( node_data.map_refs[2] == 0u )
+        continue;
+
+      /* the positive phase is preferred whenever it has a match */
+      unsigned use_phase = node_data.best_supergate[0] == nullptr ? 1u : 0u;
+
+      if ( node_data.best_supergate[use_phase] == nullptr )
+      {
+        /* Library is not complete, mapping is not possible */
+        std::cerr << "[i] MAP ERROR: technology library is not complete, impossible to perform mapping" << std::endl;
+        st.mapping_error = true;
+        return false;
+      }
+
+      if ( node_data.same_match || node_data.map_refs[use_phase] > 0 )
+      {
+        if constexpr ( !ELA )
+        {
+          reference_leaves( index, use_phase );
+        }
+        area += node_data.area[use_phase];
+
+        /* the other phase is derived from this match with an inverter */
+        if ( node_data.same_match && node_data.map_refs[use_phase ^ 1] > 0 )
+        {
+          area += lib_inv_area;
+        }
+      }
+
+      /* invert the phase */
+      use_phase = use_phase ^ 1;
+
+      /* if both phases are implemented and used */
+      if ( !node_data.same_match && node_data.map_refs[use_phase] > 0 )
+      {
+        if constexpr ( !ELA )
+        {
+          reference_leaves( index, use_phase );
+        }
+        area += node_data.area[use_phase];
+      }
+    }
+
+    /* blend estimated references */
+    for ( auto i = 0u; i < ntk.size(); ++i )
+    {
+      node_match[i].est_refs[2] = coef * node_match[i].est_refs[2] + ( 1.0f - coef ) * std::max( 1.0f, static_cast<float>( node_match[i].map_refs[2] ) );
+      node_match[i].est_refs[1] = coef * node_match[i].est_refs[1] + ( 1.0f - coef ) * std::max( 1.0f, static_cast<float>( node_match[i].map_refs[1] ) );
+      node_match[i].est_refs[0] = coef * node_match[i].est_refs[0] + ( 1.0f - coef ) * std::max( 1.0f, static_cast<float>( node_match[i].map_refs[0] ) );
+    }
+
+    ++iteration;
+    return true;
+  }
+
+  /* Computes the required time of both phases of every node.
+   *
+   * All required times are reset to the largest `double`. Unless no round
+   * has been completed yet (`iteration == 0`), the POs are then constrained
+   * to the current worst delay -- or to `ps.required_time` if that target is
+   * set and can be met -- and the constraint is propagated through the
+   * selected cuts towards the PIs.
+   *
+   * The propagation walks `top_order` backwards, like `set_mapping_refs`
+   * does, so it does not depend on node indices being topologically sorted
+   * or on all PIs and constants having the smallest indices.
+   */
+  void compute_required_time()
+  {
+    for ( auto i = 0u; i < node_match.size(); ++i )
+    {
+      node_match[i].required[0] = node_match[i].required[1] = std::numeric_limits<double>::max();
+    }
+
+    /* return in case of `skip_delay_round` */
+    if ( iteration == 0 )
+      return;
+
+    auto required = delay;
+
+    if ( ps.required_time != 0.0f )
+    {
+      /* Global target time constraint */
+      if ( ps.required_time < delay - epsilon )
+      {
+        if ( !ps.skip_delay_round && iteration == 1 )
+          std::cerr << fmt::format( "[i] MAP WARNING: cannot meet the target required time of {:.2f}", ps.required_time ) << std::endl;
+      }
+      else
+      {
+        required = ps.required_time;
+      }
+    }
+
+    /* set the required time at POs */
+    ntk.foreach_po( [&]( auto const& s ) {
+      const auto index = ntk.node_to_index( ntk.get_node( s ) );
+      if ( ntk.is_complemented( s ) )
+        node_match[index].required[1] = required;
+      else
+        node_match[index].required[0] = required;
+    } );
+
+    /* tightens the required time of each leaf of the best cut selected for
+     * `phase` at node `index` by the pin-to-output delay of the matched gate;
+     * bit k of the stored pin phases tells which phase of the k-th leaf is
+     * used */
+    auto const propagate_to_leaves = [this]( auto const index, unsigned const phase ) {
+      auto const& node_data = node_match[index];
+      auto const& best_cut = cuts.cuts( index )[node_data.best_cut[phase]];
+      auto const* sg = node_data.best_supergate[phase];
+      auto ctr = 0u;
+
+      for ( auto const leaf : best_cut )
+      {
+        auto const leaf_phase = ( node_data.phase[phase] >> ctr ) & 1;
+        node_match[leaf].required[leaf_phase] = std::min( node_match[leaf].required[leaf_phase], node_data.required[phase] - sg->tdelay[ctr] );
+        ++ctr;
+      }
+    };
+
+    /* propagate required time to the PIs */
+    for ( auto it = top_order.rbegin(); it != top_order.rend(); ++it )
+    {
+      if ( ntk.is_pi( *it ) || ntk.is_constant( *it ) )
+        continue;
+
+      const auto i = ntk.node_to_index( *it );
+
+      if ( node_match[i].map_refs[2] == 0 )
+        continue;
+
+      auto& node_data = node_match[i];
+
+      /* the positive phase is preferred whenever it has a match */
+      unsigned use_phase = node_data.best_supergate[0] == nullptr ? 1u : 0u;
+      unsigned other_phase = use_phase ^ 1;
+
+      assert( node_data.best_supergate[0] != nullptr || node_data.best_supergate[1] != nullptr );
+      assert( node_data.map_refs[0] || node_data.map_refs[1] );
+
+      /* propagate required time over the output inverter if present */
+      if ( node_data.same_match && node_data.map_refs[other_phase] > 0 )
+      {
+        node_data.required[use_phase] = std::min( node_data.required[use_phase], node_data.required[other_phase] - lib_inv_delay );
+      }
+
+      if ( node_data.same_match || node_data.map_refs[use_phase] > 0 )
+      {
+        propagate_to_leaves( i, use_phase );
+      }
+
+      /* both phases are implemented and the other one is used as well */
+      if ( !node_data.same_match && node_data.map_refs[other_phase] > 0 )
+      {
+        propagate_to_leaves( i, other_phase );
+      }
+    }
+  }
+
+  /*! \brief Selects the best supergate match for one output phase of a node.
+   *
+   * The search starts from the match currently stored for `phase` (if any),
+   * whose arrival time and area flow are recomputed first. Then every cut of
+   * the node that is not flagged `ignore`, and every supergate matched to it
+   * for `phase`, is evaluated and ranked with `compare_map<DO_AREA>`.
+   * When `DO_AREA` is set, candidates whose arrival time exceeds the required
+   * time of the phase (plus `epsilon`) are discarded.
+   * The winning match is written back into `node_match`.
+   *
+   * \param n Node to match
+   * \param phase Output phase to match (index into the per-phase arrays)
+   */
+  template<bool DO_AREA>
+  void match_phase( node<Ntk> const& n, uint8_t phase )
+  {
+    double best_arrival = std::numeric_limits<double>::max();
+    double best_area_flow = std::numeric_limits<double>::max();
+    float best_area = std::numeric_limits<float>::max();
+    uint32_t best_size = UINT32_MAX;
+    uint8_t best_cut = 0u;
+    uint8_t best_phase = 0u;
+    uint8_t cut_index = 0u;
+    auto index = ntk.node_to_index( n );
+
+    auto& node_data = node_match[index];
+    auto& cut_matches = matches[index];
+    supergate<NInputs> const* best_supergate = node_data.best_supergate[phase];
+
+    /* recompute best match info */
+    if ( best_supergate != nullptr )
+    {
+      auto const& cut = cuts.cuts( index )[node_data.best_cut[phase]];
+
+      best_phase = node_data.phase[phase];
+      best_arrival = 0.0f;
+      best_area_flow = best_supergate->area + cut_leaves_flow( cut, n, phase );
+      best_area = best_supergate->area;
+      best_cut = node_data.best_cut[phase];
+      best_size = cut.size();
+
+      /* arrival is the worst pin arrival: leaf arrival (in the pin polarity) + pin delay */
+      auto ctr = 0u;
+      for ( auto l : cut )
+      {
+        double arrival_pin = node_match[l].arrival[( best_phase >> ctr ) & 1] + best_supergate->tdelay[ctr];
+        best_arrival = std::max( best_arrival, arrival_pin );
+        ++ctr;
+      }
+    }
+
+    /* foreach cut */
+    for ( auto& cut : cuts.cuts( index ) )
+    {
+      /* trivial cuts or not matched cuts */
+      if ( ( *cut )->data.ignore )
+      {
+        ++cut_index;
+        continue;
+      }
+
+      auto const& supergates = cut_matches[( *cut )->data.match_index];
+
+      /* no gate implements this cut in the requested phase */
+      if ( supergates[phase] == nullptr )
+      {
+        ++cut_index;
+        continue;
+      }
+
+      /* match each gate and take the best one */
+      for ( auto const& gate : *supergates[phase] )
+      {
+        /* cut_leaves_flow reads node_data.phase[phase], so the candidate pin
+           polarities are stored temporarily; the final value is set at the end */
+        node_data.phase[phase] = gate.polarity;
+        double area_local = gate.area + cut_leaves_flow( *cut, n, phase );
+        double worst_arrival = 0.0f;
+
+        auto ctr = 0u;
+        for ( auto l : *cut )
+        {
+          double arrival_pin = node_match[l].arrival[( gate.polarity >> ctr ) & 1] + gate.tdelay[ctr];
+          worst_arrival = std::max( worst_arrival, arrival_pin );
+          ++ctr;
+        }
+
+        /* in area mode, skip candidates that violate the required time */
+        if constexpr ( DO_AREA )
+        {
+          if ( worst_arrival > node_data.required[phase] + epsilon )
+            continue;
+        }
+
+        if ( compare_map<DO_AREA>( worst_arrival, best_arrival, area_local, best_area_flow, cut->size(), best_size ) )
+        {
+          best_arrival = worst_arrival;
+          best_area_flow = area_local;
+          best_size = cut->size();
+          best_cut = cut_index;
+          best_area = gate.area;
+          best_phase = gate.polarity;
+          best_supergate = &gate;
+        }
+      }
+
+      ++cut_index;
+    }
+
+    /* store the selected match */
+    node_data.flows[phase] = best_area_flow;
+    node_data.arrival[phase] = best_arrival;
+    node_data.area[phase] = best_area;
+    node_data.best_cut[phase] = best_cut;
+    node_data.phase[phase] = best_phase;
+    node_data.best_supergate[phase] = best_supergate;
+  }
+
+  /*! \brief Selects the best match for one output phase using exact area.
+   *
+   * Same search as `match_phase`, but each candidate is costed by referencing
+   * and immediately dereferencing its cut (`cut_ref` / `cut_deref`), and the
+   * value returned by `cut_ref` is used as the area. Candidates whose arrival
+   * time exceeds the required time of the phase (plus `epsilon`) are discarded;
+   * the others are ranked with `compare_map<true>`.
+   *
+   * If the phase has its own match in the cover (`!same_match` and
+   * `map_refs[phase] != 0`), its cut is dereferenced before the search and the
+   * selected cut is referenced again at the end.
+   *
+   * \param n Node to match
+   * \param phase Output phase to match (index into the per-phase arrays)
+   */
+  void match_phase_exact( node<Ntk> const& n, uint8_t phase )
+  {
+    double best_arrival = std::numeric_limits<double>::max();
+    float best_exact_area = std::numeric_limits<float>::max();
+    float best_area = std::numeric_limits<float>::max();
+    uint32_t best_size = UINT32_MAX;
+    uint8_t best_cut = 0u;
+    uint8_t best_phase = 0u;
+    uint8_t cut_index = 0u;
+    auto index = ntk.node_to_index( n );
+
+    auto& node_data = node_match[index];
+    auto& cut_matches = matches[index];
+    supergate<NInputs> const* best_supergate = node_data.best_supergate[phase];
+
+    /* recompute best match info */
+    if ( best_supergate != nullptr )
+    {
+      auto const& cut = cuts.cuts( index )[node_data.best_cut[phase]];
+
+      best_phase = node_data.phase[phase];
+      best_arrival = 0.0f;
+      best_area = best_supergate->area;
+      best_cut = node_data.best_cut[phase];
+      best_size = cut.size();
+
+      auto ctr = 0u;
+      for ( auto l : cut )
+      {
+        double arrival_pin = node_match[l].arrival[( best_phase >> ctr ) & 1] + best_supergate->tdelay[ctr];
+        best_arrival = std::max( best_arrival, arrival_pin );
+        ++ctr;
+      }
+
+      /* if cut is implemented, remove it from the cover */
+      if ( !node_data.same_match && node_data.map_refs[phase] )
+      {
+        best_exact_area = cut_deref( cuts.cuts( index )[best_cut], n, phase );
+      }
+      else
+      {
+        /* otherwise reference and immediately dereference it to measure its area */
+        best_exact_area = cut_ref( cuts.cuts( index )[best_cut], n, phase );
+        cut_deref( cuts.cuts( index )[best_cut], n, phase );
+      }
+    }
+
+    /* foreach cut */
+    for ( auto& cut : cuts.cuts( index ) )
+    {
+      /* trivial cuts or not matched cuts */
+      if ( ( *cut )->data.ignore )
+      {
+        ++cut_index;
+        continue;
+      }
+
+      auto const& supergates = cut_matches[( *cut )->data.match_index];
+
+      /* no gate implements this cut in the requested phase */
+      if ( supergates[phase] == nullptr )
+      {
+        ++cut_index;
+        continue;
+      }
+
+      /* match each gate and take the best one */
+      for ( auto const& gate : *supergates[phase] )
+      {
+        /* cut_ref and cut_deref read node_data.phase[phase] and node_data.area[phase],
+           so the candidate values are stored temporarily; the final values are set at the end */
+        node_data.phase[phase] = gate.polarity;
+        node_data.area[phase] = gate.area;
+        float area_exact = cut_ref( *cut, n, phase );
+        cut_deref( *cut, n, phase );
+        double worst_arrival = 0.0f;
+
+        auto ctr = 0u;
+        for ( auto l : *cut )
+        {
+          double arrival_pin = node_match[l].arrival[( gate.polarity >> ctr ) & 1] + gate.tdelay[ctr];
+          worst_arrival = std::max( worst_arrival, arrival_pin );
+          ++ctr;
+        }
+
+        /* skip candidates that violate the required time */
+        if ( worst_arrival > node_data.required[phase] + epsilon )
+          continue;
+
+        if ( compare_map<true>( worst_arrival, best_arrival, area_exact, best_exact_area, cut->size(), best_size ) )
+        {
+          best_arrival = worst_arrival;
+          best_exact_area = area_exact;
+          best_area = gate.area;
+          best_size = cut->size();
+          best_cut = cut_index;
+          best_phase = gate.polarity;
+          best_supergate = &gate;
+        }
+      }
+
+      ++cut_index;
+    }
+
+    /* store the selected match */
+    node_data.flows[phase] = best_exact_area;
+    node_data.arrival[phase] = best_arrival;
+    node_data.area[phase] = best_area;
+    node_data.best_cut[phase] = best_cut;
+    node_data.phase[phase] = best_phase;
+    node_data.best_supergate[phase] = best_supergate;
+
+    /* put the selected cut back in the cover if it was removed above;
+       the call is made for its side effects, the value assigned here is not read afterwards */
+    if ( !node_data.same_match && node_data.map_refs[phase] )
+    {
+      best_exact_area = cut_ref( cuts.cuts( index )[best_cut], n, phase );
+    }
+  }
+
+  /*! \brief Decides whether a node keeps both phase matches or a single one plus an inverter.
+   *
+   * If only one phase has a match, that match is used for both phases.
+   * Otherwise a phase may be dropped and derived from the other one through an
+   * inverter:
+   * - in delay mode (`!DO_AREA`) when doing so does not worsen the arrival time
+   *   of the dropped phase (within `epsilon`);
+   * - in area mode (`DO_AREA`) when the inverted arrival meets the required time
+   *   of the dropped phase reduced by `required_margin_factor * lib_inv_delay`.
+   * With `ELA`, after the first iteration, a node with an unreferenced phase is
+   * forced to a single match, and the cut reference counters are updated
+   * according to the decision.
+   * If no phase can be dropped, both matches are kept and their flows are
+   * divided by the respective estimated references.
+   *
+   * \param n Node to process
+   * \param required_margin_factor Multiplier of the inverter delay used as timing margin in area mode
+   */
+  template<bool DO_AREA, bool ELA>
+  void match_drop_phase( node<Ntk> const& n, float required_margin_factor )
+  {
+    auto index = ntk.node_to_index( n );
+    auto& node_data = node_match[index];
+
+    /* compute arrival adding an inverter to the other match phase */
+    double worst_arrival_npos = node_data.arrival[1] + lib_inv_delay;
+    double worst_arrival_nneg = node_data.arrival[0] + lib_inv_delay;
+    /* use_zero: keep only the phase 0 match; use_one: keep only the phase 1 match */
+    bool use_zero = false;
+    bool use_one = false;
+
+    /* only one phase is matched */
+    if ( node_data.best_supergate[0] == nullptr )
+    {
+      set_match_complemented_phase( index, 1, worst_arrival_npos );
+      if constexpr ( ELA )
+      {
+        if ( node_data.map_refs[2] )
+          cut_ref( cuts.cuts( index )[node_data.best_cut[1]], n, 1 );
+      }
+      return;
+    }
+    else if ( node_data.best_supergate[1] == nullptr )
+    {
+      set_match_complemented_phase( index, 0, worst_arrival_nneg );
+      if constexpr ( ELA )
+      {
+        if ( node_data.map_refs[2] )
+          cut_ref( cuts.cuts( index )[node_data.best_cut[0]], n, 0 );
+      }
+      return;
+    }
+
+    /* try to use only one match to cover both phases */
+    if constexpr ( !DO_AREA )
+    {
+      /* if arrival improves matching the other phase and inserting an inverter */
+      if ( worst_arrival_npos < node_data.arrival[0] + epsilon )
+      {
+        use_one = true;
+      }
+      if ( worst_arrival_nneg < node_data.arrival[1] + epsilon )
+      {
+        use_zero = true;
+      }
+    }
+    else
+    {
+      /* check if both phases + inverter meet the required time */
+      use_zero = worst_arrival_nneg < ( node_data.required[1] + epsilon - required_margin_factor * lib_inv_delay );
+      use_one = worst_arrival_npos < ( node_data.required[0] + epsilon - required_margin_factor * lib_inv_delay );
+    }
+
+    /* condition on not used phases, evaluate a substitution during exact area recovery */
+    if constexpr ( ELA )
+    {
+      if ( iteration != 0 )
+      {
+        if ( node_data.map_refs[0] == 0 || node_data.map_refs[1] == 0 )
+        {
+          /* select the used match */
+          /* phase: phase assumed to be in use; nphase: the other one */
+          auto phase = 0;
+          auto nphase = 0;
+          if ( node_data.map_refs[0] == 0 )
+          {
+            phase = 1;
+            use_one = true;
+            use_zero = false;
+          }
+          else
+          {
+            nphase = 1;
+            use_one = false;
+            use_zero = true;
+          }
+          /* select the not used match instead if it leads to area improvement and doesn't violate the required time */
+          if ( node_data.arrival[nphase] + lib_inv_delay < node_data.required[phase] + epsilon )
+          {
+            auto size_phase = cuts.cuts( index )[node_data.best_cut[phase]].size();
+            auto size_nphase = cuts.cuts( index )[node_data.best_cut[nphase]].size();
+
+            if ( compare_map<DO_AREA>( node_data.arrival[nphase] + lib_inv_delay, node_data.arrival[phase], node_data.flows[nphase] + lib_inv_area, node_data.flows[phase], size_nphase, size_phase ) )
+            {
+              /* invert the choice */
+              use_zero = !use_zero;
+              use_one = !use_one;
+            }
+          }
+        }
+      }
+    }
+
+    if ( !use_zero && !use_one )
+    {
+      /* use both phases */
+      node_data.flows[0] = node_data.flows[0] / node_data.est_refs[0];
+      node_data.flows[1] = node_data.flows[1] / node_data.est_refs[1];
+      node_data.flows[2] = node_data.flows[0] + node_data.flows[1];
+      node_data.same_match = false;
+      return;
+    }
+
+    /* use area flow as a tiebreaker */
+    if ( use_zero && use_one )
+    {
+      auto size_zero = cuts.cuts( index )[node_data.best_cut[0]].size();
+      auto size_one = cuts.cuts( index )[node_data.best_cut[1]].size();
+      if ( compare_map<DO_AREA>( worst_arrival_nneg, worst_arrival_npos, node_data.flows[0], node_data.flows[1], size_zero, size_one ) )
+        use_one = false;
+      else
+        use_zero = false;
+    }
+
+    /* exactly one of use_zero / use_one is set from here on */
+    if ( use_zero )
+    {
+      if constexpr ( ELA )
+      {
+        /* set cut references */
+        if ( !node_data.same_match )
+        {
+          /* dereference the negative phase cut if in use */
+          if ( node_data.map_refs[1] > 0 )
+            cut_deref( cuts.cuts( index )[node_data.best_cut[1]], n, 1 );
+          /* reference the positive cut if not in use before */
+          if ( node_data.map_refs[0] == 0 && node_data.map_refs[2] )
+            cut_ref( cuts.cuts( index )[node_data.best_cut[0]], n, 0 );
+        }
+        else if ( node_data.map_refs[2] )
+          cut_ref( cuts.cuts( index )[node_data.best_cut[0]], n, 0 );
+      }
+      set_match_complemented_phase( index, 0, worst_arrival_nneg );
+    }
+    else
+    {
+      if constexpr ( ELA )
+      {
+        /* set cut references */
+        if ( !node_data.same_match )
+        {
+          /* dereference the positive phase cut if in use */
+          if ( node_data.map_refs[0] > 0 )
+            cut_deref( cuts.cuts( index )[node_data.best_cut[0]], n, 0 );
+          /* reference the negative cut if not in use before */
+          if ( node_data.map_refs[1] == 0 && node_data.map_refs[2] )
+            cut_ref( cuts.cuts( index )[node_data.best_cut[1]], n, 1 );
+        }
+        else if ( node_data.map_refs[2] )
+          cut_ref( cuts.cuts( index )[node_data.best_cut[1]], n, 1 );
+      }
+      set_match_complemented_phase( index, 1, worst_arrival_npos );
+    }
+  }
+
+  /*! \brief Makes a node use the match of one phase for both output phases.
+   *
+   * The other phase loses its own supergate and inherits cut, pin polarities
+   * and area of the kept phase; its arrival time is set to `worst_arrival_n`.
+   * The flow of the kept phase is divided by `est_refs[2]` and copied to all
+   * three flow slots.
+   *
+   * \param index Index of the node
+   * \param phase Phase whose match is kept
+   * \param worst_arrival_n Arrival time to store for the complemented phase
+   */
+  inline void set_match_complemented_phase( uint32_t index, uint8_t phase, double worst_arrival_n )
+  {
+    auto& match = node_match[index];
+    auto const other = phase ^ 1;
+
+    match.same_match = true;
+
+    /* the complemented phase has no gate of its own */
+    match.best_supergate[other] = nullptr;
+    match.best_cut[other] = match.best_cut[phase];
+    match.phase[other] = match.phase[phase];
+    match.area[other] = match.area[phase];
+    match.arrival[other] = worst_arrival_n;
+
+    /* a single flow value is shared by both phases and by the combined slot */
+    match.flows[phase] = match.flows[phase] / match.est_refs[2];
+    match.flows[2] = match.flows[phase];
+    match.flows[other] = match.flows[phase];
+  }
+
+  /*! \brief Matches the constant node with the constant gates of the library.
+   *
+   * Looks up the supergates implementing constant zero and constant one.
+   * If neither exists nothing is changed. If only one exists, the missing
+   * phase is derived from it by adding the inverter delay and area, and the
+   * node is flagged as `same_match`.
+   *
+   * \param index Index of the constant node
+   */
+  void match_constants( uint32_t index )
+  {
+    auto& data = node_match[index];
+
+    kitty::static_truth_table<NInputs> zero_tt;
+    auto const supergates_zero = library.get_supergates( zero_tt );
+    auto const supergates_one = library.get_supergates( ~zero_tt );
+
+    bool const has_zero = supergates_zero != nullptr;
+    bool const has_one = supergates_one != nullptr;
+
+    /* Not available in the library */
+    if ( !has_zero && !has_one )
+      return;
+
+    /* phase p is implemented directly by the first gate of the list */
+    auto const take_gate = [&]( unsigned p, auto const* gates ) {
+      data.best_supergate[p] = &( ( *gates )[0] );
+      data.arrival[p] = data.best_supergate[p]->worstDelay;
+      data.area[p] = data.best_supergate[p]->area;
+      data.phase[p] = 0;
+    };
+
+    /* phase p is obtained from the opposite phase through an inverter */
+    auto const take_inverted = [&]( unsigned p ) {
+      data.same_match = true;
+      data.arrival[p] = data.arrival[p ^ 1] + lib_inv_delay;
+      data.area[p] = data.area[p ^ 1] + lib_inv_area;
+      data.phase[p] = 1;
+    };
+
+    if ( has_zero )
+      take_gate( 0, supergates_zero );
+
+    if ( has_one )
+      take_gate( 1, supergates_one );
+    else
+      take_inverted( 1 );
+
+    if ( !has_zero )
+      take_inverted( 0 );
+  }
+
+  /*! \brief Sums the flows of the leaves of a cut.
+   *
+   * Each leaf contributes the flow of the phase selected by the corresponding
+   * bit of `node_match[n].phase[phase]`.
+   *
+   * \param cut Cut whose leaves are accumulated
+   * \param n Root node of the cut
+   * \param phase Output phase of the root whose pin polarities are used
+   * \return Sum of the leaf flows
+   */
+  inline double cut_leaves_flow( cut_t const& cut, node<Ntk> const& n, uint8_t phase )
+  {
+    auto const& root_data = node_match[ntk.node_to_index( n )];
+    double total = 0.0;
+
+    uint8_t pin = 0u;
+    for ( auto leaf : cut )
+    {
+      /* bit `pin` of the polarity mask selects the leaf phase */
+      uint8_t const polarity = ( root_data.phase[phase] >> pin ) & 1;
+      total += node_match[leaf].flows[polarity];
+      ++pin;
+    }
+
+    return total;
+  }
+
+  /*! \brief References a cut in the cover and returns the area it adds.
+   *
+   * Increments the reference counters of the leaves of `cut` in the phase
+   * requested by the pin polarities of `node_match[n].phase[phase]`. Leaves
+   * that were not referenced before are referenced recursively through their
+   * own best cut. Constant leaves are skipped.
+   *
+   * \param cut Cut to reference
+   * \param n Root node of the cut
+   * \param phase Output phase of the root being implemented
+   * \return `node_match[n].area[phase]` plus the inverter areas and the areas
+   *         returned by the recursive calls
+   */
+  float cut_ref( cut_t const& cut, node<Ntk> const& n, uint8_t phase )
+  {
+    auto const& node_data = node_match[ntk.node_to_index( n )];
+    float count = node_data.area[phase];
+
+    uint8_t ctr = 0;
+    for ( auto leaf : cut )
+    {
+      /* compute leaf phase using the current gate */
+      uint8_t leaf_phase = ( node_data.phase[phase] >> ctr++ ) & 1;
+
+      if ( ntk.is_constant( ntk.index_to_node( leaf ) ) )
+      {
+        continue;
+      }
+      else if ( ntk.is_pi( ntk.index_to_node( leaf ) ) )
+      {
+        /* reference PIs, add inverter cost for negative phase */
+        if ( leaf_phase == 1u )
+        {
+          /* the inverter is counted only by the first reference */
+          if ( node_match[leaf].map_refs[1]++ == 0u )
+            count += lib_inv_area;
+        }
+        else
+        {
+          ++node_match[leaf].map_refs[0];
+        }
+        continue;
+      }
+
+      if ( node_match[leaf].same_match )
+      {
+        /* Add inverter area if not present yet and leaf node is implemented in the opposite phase */
+        if ( node_match[leaf].map_refs[leaf_phase]++ == 0u && node_match[leaf].best_supergate[leaf_phase] == nullptr )
+          count += lib_inv_area;
+        /* Recursive referencing if leaf was not referenced */
+        if ( node_match[leaf].map_refs[2]++ == 0u )
+        {
+          count += cut_ref( cuts.cuts( leaf )[node_match[leaf].best_cut[leaf_phase]], ntk.index_to_node( leaf ), leaf_phase );
+        }
+      }
+      else
+      {
+        /* the two phases have separate matches: recurse when this phase was not referenced yet */
+        ++node_match[leaf].map_refs[2];
+        if ( node_match[leaf].map_refs[leaf_phase]++ == 0u )
+        {
+          count += cut_ref( cuts.cuts( leaf )[node_match[leaf].best_cut[leaf_phase]], ntk.index_to_node( leaf ), leaf_phase );
+        }
+      }
+    }
+    return count;
+  }
+
+  /*! \brief Dereferences a cut from the cover and returns the area it frees.
+   *
+   * Counterpart of `cut_ref`: decrements the reference counters of the leaves
+   * of `cut` in the phase requested by the pin polarities of
+   * `node_match[n].phase[phase]`. Leaves whose counter reaches zero are
+   * dereferenced recursively through their own best cut. Constant leaves are
+   * skipped.
+   *
+   * \param cut Cut to dereference
+   * \param n Root node of the cut
+   * \param phase Output phase of the root being removed
+   * \return `node_match[n].area[phase]` plus the inverter areas and the areas
+   *         returned by the recursive calls
+   */
+  float cut_deref( cut_t const& cut, node<Ntk> const& n, uint8_t phase )
+  {
+    auto const& node_data = node_match[ntk.node_to_index( n )];
+    float count = node_data.area[phase];
+    uint8_t ctr = 0;
+    for ( auto leaf : cut )
+    {
+      /* compute leaf phase using the current gate */
+      uint8_t leaf_phase = ( node_data.phase[phase] >> ctr++ ) & 1;
+
+      if ( ntk.is_constant( ntk.index_to_node( leaf ) ) )
+      {
+        continue;
+      }
+      else if ( ntk.is_pi( ntk.index_to_node( leaf ) ) )
+      {
+        /* dereference PIs, add inverter cost for negative phase */
+        if ( leaf_phase == 1u )
+        {
+          /* the inverter is counted only when the last reference is removed */
+          if ( --node_match[leaf].map_refs[1] == 0u )
+            count += lib_inv_area;
+        }
+        else
+        {
+          --node_match[leaf].map_refs[0];
+        }
+        continue;
+      }
+
+      if ( node_match[leaf].same_match )
+      {
+        /* Add inverter area if it is used only by the current gate and leaf node is implemented in the opposite phase */
+        if ( --node_match[leaf].map_refs[leaf_phase] == 0u && node_match[leaf].best_supergate[leaf_phase] == nullptr )
+          count += lib_inv_area;
+        /* Recursive dereferencing */
+        if ( --node_match[leaf].map_refs[2] == 0u )
+        {
+          count += cut_deref( cuts.cuts( leaf )[node_match[leaf].best_cut[leaf_phase]], ntk.index_to_node( leaf ), leaf_phase );
+        }
+      }
+      else
+      {
+        /* the two phases have separate matches: recurse when this phase is no longer referenced */
+        --node_match[leaf].map_refs[2];
+        if ( --node_match[leaf].map_refs[leaf_phase] == 0u )
+        {
+          count += cut_deref( cuts.cuts( leaf )[node_match[leaf].best_cut[leaf_phase]], ntk.index_to_node( leaf ), leaf_phase );
+        }
+      }
+    }
+    return count;
+  }
+
+  /*! \brief Creates the destination k-LUT network and the node translation map.
+   *
+   * The constant node is mapped to the two constants of the destination
+   * (slot 0: false, slot 1: true) and one primary input is created for each
+   * primary input of the source network (stored in slot 0).
+   *
+   * \return The new network together with the old-to-new signal map
+   */
+  std::pair<klut_network, klut_map> initialize_map_network()
+  {
+    klut_network dest;
+    klut_map old2new;
+
+    /* constants: both polarities are directly available */
+    auto const const_index = ntk.node_to_index( ntk.get_node( ntk.get_constant( false ) ) );
+    old2new[const_index][0] = dest.get_constant( false );
+    old2new[const_index][1] = dest.get_constant( true );
+
+    /* primary inputs: only the positive polarity is created here */
+    ntk.foreach_pi( [&]( auto const& pi ) {
+      auto const pi_index = ntk.node_to_index( pi );
+      old2new[pi_index][0] = dest.create_pi();
+    } );
+
+    return { dest, old2new };
+  }
+
+  /*! \brief Builds the mapped network from the selected cover.
+   *
+   * Visits the nodes of the source network and, for every node referenced in
+   * the cover (`map_refs[2] != 0`), creates the LUTs of the selected matches
+   * and the inverters needed to provide the complemented phase. Primary inputs
+   * get an inverter when their negative phase is referenced. Finally the
+   * primary outputs are created and area, delay and gate usage are written to
+   * the statistics.
+   *
+   * \param res Destination network (already containing constants and PIs)
+   * \param old2new Map from source node index to the destination signals of both phases
+   */
+  void finalize_cover( klut_network& res, klut_map& old2new )
+  {
+    ntk.foreach_node( [&]( auto const& n ) {
+      if ( ntk.is_constant( n ) )
+        return true;
+
+      auto index = ntk.node_to_index( n );
+
+      /* add inverter at PI if needed */
+      if ( ntk.is_pi( n ) )
+      {
+        /* the map is keyed by node index, like every other access in this class */
+        if ( node_match[index].map_refs[1] > 0 )
+          old2new[index][1] = res.create_not( old2new[index][0] );
+        return true;
+      }
+
+      /* continue if cut is not in the cover */
+      if ( node_match[index].map_refs[2] == 0u )
+        return true;
+
+      auto const& node_data = node_match[index];
+      /* start from the phase that owns a supergate */
+      unsigned phase = ( node_data.best_supergate[0] != nullptr ) ? 0 : 1;
+
+      /* add used cut */
+      if ( node_data.same_match || node_data.map_refs[phase] > 0 )
+      {
+        create_lut_for_gate( res, old2new, index, phase );
+
+        /* add inverted version if used */
+        if ( node_data.same_match && node_data.map_refs[phase ^ 1] > 0 )
+          old2new[index][phase ^ 1] = res.create_not( old2new[index][phase] );
+      }
+
+      phase = phase ^ 1;
+      /* add the optional other match if used */
+      if ( !node_data.same_match && node_data.map_refs[phase] > 0 )
+      {
+        create_lut_for_gate( res, old2new, index, phase );
+      }
+
+      return true;
+    } );
+
+    /* create POs */
+    ntk.foreach_po( [&]( auto const& f ) {
+      /* a complemented output uses the negative-phase signal of its driver */
+      if ( ntk.is_complemented( f ) )
+      {
+        res.create_po( old2new[ntk.node_to_index( ntk.get_node( f ) )][1] );
+      }
+      else
+      {
+        res.create_po( old2new[ntk.node_to_index( ntk.get_node( f ) )][0] );
+      }
+    } );
+
+    /* write final results */
+    st.area = area;
+    st.delay = delay;
+    compute_gates_usage();
+  }
+
+  /*! \brief Creates the LUT implementing the selected match of a node phase.
+   *
+   * The fanins are the destination signals of the cut leaves, taken in the
+   * polarity given by the match and placed at the pin positions given by the
+   * supergate permutation. The LUT function is the function of the root gate.
+   *
+   * \param res Destination network
+   * \param old2new Map from source node index to the destination signals of both phases
+   * \param index Index of the node being implemented
+   * \param phase Output phase being implemented
+   */
+  void create_lut_for_gate( klut_network& res, klut_map& old2new, uint32_t index, unsigned phase )
+  {
+    auto const& match = node_match[index];
+    auto const* selected = match.best_supergate[phase];
+    auto& leaves = cuts.cuts( index )[match.best_cut[phase]];
+    auto const root_gate = selected->root;
+    // auto tt = cuts.truth_table( best_cut );
+
+    /* check correctness */
+    /* invert the truth table if using the negative phase */
+    // if ( phase == 1 )
+    //   tt = ~tt;
+    // uint32_t neg = 0;
+    // for ( auto i = 0u; i < best_cut.size(); ++i )
+    // {
+    //   neg |= ( ( node_data.phase[phase] >> i ) & 1 ) << node_data.best_supergate[phase]->permutation[i];
+    // }
+    // auto check_tt = kitty::create_from_npn_config( std::make_tuple( tt, neg, node_data.best_supergate[phase]->permutation ) );
+    // assert( gate->function == check_tt );
+
+    /* place every leaf signal, in the matched polarity, at its permuted pin */
+    std::vector<signal<klut_network>> fanins( leaves.size() );
+
+    auto pin = 0u;
+    for ( auto leaf : leaves )
+    {
+      auto const polarity = ( match.phase[phase] >> pin ) & 1;
+      fanins[selected->permutation[pin]] = old2new[leaf][polarity];
+      ++pin;
+    }
+
+    /* create the node and register it for this phase */
+    old2new[index][phase] = res.create_node( fanins, root_gate->function );
+  }
+
+  /*! \brief Tells whether a candidate match is better than the current best one.
+   *
+   * With `DO_AREA` the area flow is compared first and the arrival time second;
+   * otherwise the arrival time is compared first and the area flow second.
+   * Two values closer than `epsilon` are considered equal. If both criteria
+   * tie, the candidate wins only with a strictly smaller cut size.
+   *
+   * \return `true` if the candidate should replace the current best
+   */
+  template<bool DO_AREA>
+  inline bool compare_map( double arrival, double best_arrival, double area_flow, double best_area_flow, uint32_t size, uint32_t best_size )
+  {
+    /* order the two cost criteria according to the optimization mode */
+    double const first = DO_AREA ? area_flow : arrival;
+    double const best_first = DO_AREA ? best_area_flow : best_arrival;
+    double const second = DO_AREA ? arrival : area_flow;
+    double const best_second = DO_AREA ? best_arrival : best_area_flow;
+
+    if ( first < best_first - epsilon )
+      return true;
+    if ( first > best_first + epsilon )
+      return false;
+
+    if ( second < best_second - epsilon )
+      return true;
+    if ( second > best_second + epsilon )
+      return false;
+
+    /* last tiebreaker: cut size */
+    return size < best_size;
+  }
+
+  /*! \brief Counts the instances of each library gate in the cover and builds the usage report.
+   *
+   * Inverters are counted only when the library inverter id is valid
+   * (`lib_inv_id != UINT32_MAX`). The formatted report is stored in
+   * `st.gates_usage`.
+   */
+  void compute_gates_usage()
+  {
+    auto const& gates = library.get_gates();
+    std::vector<uint32_t> usage( gates.size(), 0u );
+
+    bool const count_inverters = lib_inv_id != UINT32_MAX;
+
+    ntk.foreach_node( [&]( auto const& n, auto ) {
+      const auto index = ntk.node_to_index( n );
+      auto& data = node_match[index];
+
+      if ( ntk.is_constant( n ) )
+      {
+        /* constants without a matched gate use no library cell */
+        if ( data.best_supergate[0] == nullptr && data.best_supergate[1] == nullptr )
+          return true;
+      }
+      else if ( ntk.is_pi( n ) )
+      {
+        /* a PI only contributes the inverter of its negative phase */
+        if ( count_inverters && data.map_refs[1] > 0 )
+          ++usage[lib_inv_id];
+        return true;
+      }
+
+      /* continue if cut is not in the cover */
+      if ( data.map_refs[2] == 0u )
+        return true;
+
+      unsigned const main_phase = ( data.best_supergate[0] != nullptr ) ? 0 : 1;
+      unsigned const other_phase = main_phase ^ 1;
+
+      if ( data.same_match )
+      {
+        /* one gate, plus an inverter when the complemented phase is used */
+        ++usage[data.best_supergate[main_phase]->root->id];
+        if ( count_inverters && data.map_refs[other_phase] > 0 )
+          ++usage[lib_inv_id];
+      }
+      else
+      {
+        /* separate gates for each referenced phase */
+        if ( data.map_refs[main_phase] > 0 )
+          ++usage[data.best_supergate[main_phase]->root->id];
+        if ( data.map_refs[other_phase] > 0 )
+          ++usage[data.best_supergate[other_phase]->root->id];
+      }
+
+      return true;
+    } );
+
+    std::stringstream report;
+    double area_sum = 0.0f;
+    uint32_t instance_sum = 0u;
+    for ( auto id = 0u; id < usage.size(); ++id )
+    {
+      if ( usage[id] == 0u )
+        continue;
+
+      auto gate_area = usage[id] * gates[id].area;
+
+      report << fmt::format( "[i] {:<15}", gates[id].name )
+             << fmt::format( "\t Instance = {:>10d}", usage[id] )
+             << fmt::format( "\t Area = {:>12.2f}", gate_area )
+             << fmt::format( " {:>8.2f} %\n", gate_area / area * 100 );
+
+      instance_sum += usage[id];
+      area_sum += gate_area;
+    }
+
+    report << fmt::format( "[i] {:<15}", "TOTAL" )
+           << fmt::format( "\t Instance = {:>10d}", instance_sum )
+           << fmt::format( "\t Area = {:>12.2f}   100.00 %\n", area_sum );
+
+    st.gates_usage = report.str();
+  }
+
+private:
+  Ntk const& ntk;
+  tech_library<NInputs> const& library;
+  map_params const& ps;
+  map_stats& st;
+
+  uint32_t iteration{ 0 };       /* current mapping iteration */
+  double delay{ 0.0f };          /* current delay of the mapping */
+  double area{ 0.0f };           /* current area of the mapping */
+  const float epsilon{ 0.005f }; /* epsilon */
+
+  /* lib inverter info */
+  float lib_inv_area;
+  float lib_inv_delay;
+  uint32_t lib_inv_id;
+
+  std::vector<node<Ntk>> top_order;
+  std::vector<node_match_tech<NInputs>> node_match;
+  std::unordered_map<uint32_t, std::vector<supergate_t>> matches;
+  network_cuts_t cuts;
+};
+
+} /* namespace detail */
+
+/*! \brief Technology mapping.
+ *
+ * This function implements a technology mapping algorithm. It is controlled by a
+ * template argument `CutData` (defaulted to `cut_enumeration_tech_map_cut`).
+ * The argument is similar to the `CutData` argument in `cut_enumeration`, which can
+ * specialize the cost function to select priority cuts and store additional data.
+ * The default argument gives priority first to the cut size, then to delay, and
+ * lastly to area flow. Thus, it is more suited for delay-oriented mapping.
+ * The type passed as `CutData` must implement the following four fields:
+ *
+ * - `uint32_t delay`
+ * - `float flow`
+ * - `uint8_t match_index`
+ * - `bool ignore`
+ *
+ * See `include/mockturtle/algorithms/cut_enumeration/cut_enumeration_tech_map_cut.hpp`
+ * for one example of a CutData type that implements the cost function that is used in
+ * the technology mapper.
+ *
+ * The function returns a k-LUT network. Each LUT abstracts a gate of the technology library.
+ *
+ * **Required network functions:**
+ * - `size`
+ * - `is_pi`
+ * - `is_constant`
+ * - `node_to_index`
+ * - `index_to_node`
+ * - `get_node`
+ * - `foreach_po`
+ * - `foreach_node`
+ * - `fanout_size`
+ *
+ * \param ntk Network
+ * \param library Technology library
+ * \param ps Mapping params
+ * \param pst Mapping statistics (optional, filled when not null)
+ */
+template<class Ntk, unsigned NInputs, typename CutData = cut_enumeration_tech_map_cut>
+klut_network tech_map( Ntk const& ntk, tech_library<NInputs> const& library, map_params const& ps = {}, map_stats* pst = nullptr )
+{
+  /* interface requirements on the network type */
+  static_assert( is_network_type_v<Ntk>, "Ntk is not a network type" );
+  static_assert( has_size_v<Ntk>, "Ntk does not implement the size method" );
+  static_assert( has_is_pi_v<Ntk>, "Ntk does not implement the is_pi method" );
+  static_assert( has_is_constant_v<Ntk>, "Ntk does not implement the is_constant method" );
+  static_assert( has_node_to_index_v<Ntk>, "Ntk does not implement the node_to_index method" );
+  static_assert( has_index_to_node_v<Ntk>, "Ntk does not implement the index_to_node method" );
+  static_assert( has_get_node_v<Ntk>, "Ntk does not implement the get_node method" );
+  static_assert( has_foreach_po_v<Ntk>, "Ntk does not implement the foreach_po method" );
+  static_assert( has_foreach_node_v<Ntk>, "Ntk does not implement the foreach_node method" );
+  static_assert( has_fanout_size_v<Ntk>, "Ntk does not implement the fanout_size method" );
+
+  map_stats stats;
+  detail::tech_map_impl<Ntk, NInputs, CutData> mapper( ntk, library, ps, stats );
+  auto mapped = mapper.run();
+
+  /* total time = mapping time + cut enumeration time */
+  stats.time_total = stats.time_mapping + stats.cut_enumeration_st.time_total;
+
+  /* the report is printed only for a successful mapping */
+  bool const print_report = ps.verbose && !stats.mapping_error;
+  if ( print_report )
+    stats.report();
+
+  if ( pst != nullptr )
+    *pst = stats;
+
+  return mapped;
+}
+
+namespace detail
+{
+
+/*! \brief Result of matching one cut against the exact library. */
+template<typename Ntk, unsigned NInputs>
+struct cut_match_t
+{
+  /* supergates implementing the cut function, one list per output phase
+     (index 0: positive, index 1: negative); null when no match exists */
+  std::vector<exact_supergate<Ntk, NInputs>> const* supergates[2]{ nullptr, nullptr };
+  /* input permutation: entry i holds the permuted position of input i */
+  std::array<uint8_t, NInputs> permutation{};
+  /* input negations after permutation, one bit per input */
+  uint8_t negation{ 0 };
+};
+
+/*! \brief Per-node mapping data used by the exact mapper.
+ *
+ * Arrays with two entries are indexed by output phase (0: positive,
+ * 1: negative); arrays with three entries have an extra slot for the
+ * combination of both phases. Every member is zero-initialized so that a
+ * default-initialized instance never exposes indeterminate values.
+ */
+template<typename Ntk, unsigned NInputs>
+struct node_match_t
+{
+  /* best supergate match for positive and negative output phases */
+  exact_supergate<Ntk, NInputs> const* best_supergate[2] = { nullptr, nullptr };
+  /* fanin pin phases for both output phases */
+  uint8_t phase[2]{};
+  /* best cut index for both phases */
+  uint32_t best_cut[2]{};
+  /* node is mapped using only one phase */
+  bool same_match{ false };
+
+  /* arrival time at node output */
+  double arrival[2]{};
+  /* required time at node output */
+  double required[2]{};
+  /* area of the best matches */
+  float area[2]{};
+
+  /* number of references in the cover 0: pos, 1: neg, 2: pos+neg */
+  uint32_t map_refs[3]{};
+  /* references estimation */
+  float est_refs[3]{};
+  /* area flow */
+  float flows[3]{};
+};
+
+template<class NtkDest, class Ntk, class RewritingFn, typename CutData, unsigned NInputs>
+class exact_map_impl
+{
+public:
+  using network_cuts_t = network_cuts<Ntk, true, CutData>;
+  using cut_t = typename network_cuts_t::cut_t;
+
+public:
+  /*! \brief Sets up the mapper state.
+   *
+   * Allocates one `node_match` entry per network node, enumerates the cuts of
+   * the network with the cut enumeration parameters in `ps`, and reads the
+   * inverter area and delay from the library.
+   *
+   * \param ntk Network to map
+   * \param library Exact library providing the supergates
+   * \param ps Mapping parameters
+   * \param st Mapping statistics (written during the run)
+   */
+  exact_map_impl( Ntk& ntk, exact_library<NtkDest, RewritingFn, NInputs> const& library, map_params const& ps, map_stats& st )
+      : ntk( ntk ),
+        library( library ),
+        ps( ps ),
+        st( st ),
+        node_match( ntk.size() ),
+        matches(),
+        cuts( cut_enumeration<Ntk, true, CutData>( ntk, ps.cut_enumeration_ps ) )
+  {
+    /* cache the inverter cost used when a phase is derived by inversion */
+    std::tie( lib_inv_area, lib_inv_delay ) = library.get_inverter_info();
+  }
+
+  /*! \brief Runs the complete mapping flow and returns the mapped network.
+   *
+   * Steps: topological ordering, cut matching, node initialization, optional
+   * delay-oriented mapping, area-flow rounds, exact-area rounds, and finally
+   * the construction of the output network.
+   */
+  NtkDest run()
+  {
+    stopwatch t( st.time_mapping );
+
+    auto [dest, node_map] = initialize_copy_network<NtkDest>( ntk );
+
+    /* compute and save topological order */
+    top_order.reserve( ntk.size() );
+    topo_view<Ntk>( ntk ).foreach_node( [this]( auto n ) {
+      top_order.push_back( n );
+    } );
+
+    /* match cuts with gates */
+    compute_matches();
+
+    /* init the data structure */
+    init_nodes();
+
+    /* compute mapping delay */
+    if ( !ps.skip_delay_round )
+      compute_mapping<false>();
+
+    /* iteration bounds of the two area recovery stages */
+    auto const area_flow_end = ps.area_flow_rounds + 1;
+    auto const exact_area_end = ps.ela_rounds + ps.area_flow_rounds + 1;
+
+    /* compute mapping using global area flow */
+    while ( iteration < area_flow_end )
+    {
+      compute_required_time();
+      compute_mapping<true>();
+    }
+
+    /* compute mapping using exact area */
+    while ( iteration < exact_area_end )
+    {
+      compute_required_time();
+      compute_exact_area();
+    }
+
+    /* generate the output network using the computed mapping */
+    finalize_cover( dest, node_map );
+
+    return dest;
+  }
+
+private:
+  /*! \brief Initializes the reference estimates of all nodes and the flow and
+   *         arrival data of constants and primary inputs.
+   */
+  void init_nodes()
+  {
+    ntk.foreach_node( [this]( auto const& n, auto ) {
+      auto& data = node_match[ntk.node_to_index( n )];
+
+      /* the initial reference estimation is the fanout count */
+      auto const fanout = static_cast<float>( ntk.fanout_size( n ) );
+      data.est_refs[0] = data.est_refs[1] = data.est_refs[2] = fanout;
+
+      bool const is_const = ntk.is_constant( n );
+      if ( !is_const && !ntk.is_pi( n ) )
+        return;
+
+      /* all terminals (constants and PIs) have flow 0.0 */
+      data.flows[0] = data.flows[1] = data.flows[2] = 0.0f;
+      data.arrival[0] = 0.0f;
+      /* PIs have the negative phase implemented with an inverter */
+      data.arrival[1] = is_const ? 0.0f : lib_inv_delay;
+    } );
+  }
+
+  void compute_matches() /* fills `matches` with the library matches of every gate and flags the cuts that cannot be used */
+  {
+    /* match every cut of every gate against the library */
+    ntk.foreach_gate( [&]( auto const& n ) {
+      const auto index = ntk.node_to_index( n );
+
+      std::vector<cut_match_t<NtkDest, NInputs>> node_matches;
+
+      auto i = 0u; /* position of the next match inside node_matches */
+      for ( auto& cut : cuts.cuts( index ) )
+      {
+        /* ignore the unit cut (the cut made of the node itself) */
+        if ( cut->size() == 1 && *cut->begin() == index )
+        {
+          ( *cut )->data.ignore = true;
+          continue;
+        }
+
+        if ( cut->size() > NInputs )
+        {
+          /* Ignore cuts too big to be mapped using the library */
+          ( *cut )->data.ignore = true;
+          continue;
+        }
+
+        /* match the cut using canonization and get the gates */
+        const auto tt = cuts.truth_table( *cut );
+        const auto fe = kitty::extend_to<NInputs>( tt );
+        const auto config = kitty::exact_npn_canonization( fe );
+        auto const supergates_npn = library.get_supergates( std::get<0>( config ) );
+        auto const supergates_npn_neg = library.get_supergates( ~std::get<0>( config ) ); /* gates of the complemented representative */
+
+        if ( supergates_npn != nullptr || supergates_npn_neg != nullptr )
+        {
+          auto neg = std::get<1>( config );
+          auto perm = std::get<2>( config );
+          uint8_t phase = ( neg >> NInputs ) & 1; /* bit NInputs of the negation mask; presumably the output negation -- confirm against kitty */
+          cut_match_t<NtkDest, NInputs> match;
+
+          match.supergates[phase] = supergates_npn;
+          match.supergates[phase ^ 1] = supergates_npn_neg;
+
+          /* store permutations and negations */
+          match.negation = 0;
+          for ( auto j = 0u; j < perm.size() && j < NInputs; ++j )
+          {
+            match.permutation[perm[j]] = j;
+            match.negation |= ( ( neg >> perm[j] ) & 1 ) << j;
+          }
+          node_matches.push_back( match );
+          ( *cut )->data.match_index = i++; /* lets the cut find its entry in matches[index] */
+        }
+        else
+        {
+          /* Ignore not matched cuts */
+          ( *cut )->data.ignore = true;
+        }
+      }
+
+      matches[index] = node_matches; /* stored even when no cut matched */
+    } );
+  }
+
+  template<bool DO_AREA>
+  void compute_mapping()
+  {
+    /* bottom-up pass: pick the best match of each gate for both output phases */
+    for ( auto const& node : top_order )
+    {
+      const bool is_terminal = ntk.is_constant( node ) || ntk.is_pi( node );
+      if ( !is_terminal )
+      {
+        /* positive phase, then negative phase */
+        match_phase<DO_AREA>( node, 0u );
+        match_phase<DO_AREA>( node, 1u );
+        /* try to drop one phase */
+        match_drop_phase<DO_AREA, false>( node, 0u );
+      }
+    }
+
+    /* remember the previous area, then recompute references, area and delay */
+    const double area_before = area;
+    set_mapping_refs<false>();
+
+    if ( !ps.verbose )
+      return;
+
+    /* round stats; `iteration` was already advanced by set_mapping_refs, */
+    /* so a value of 1 denotes the first round, which has no previous area */
+    const float area_gain = ( iteration != 1 )
+                                ? float( ( area_before - area ) / area_before * 100 )
+                                : 0.0f;
+
+    if constexpr ( DO_AREA )
+    {
+      st.round_stats.push_back(
+          fmt::format( "[i] AreaFlow : Delay = {:>12.2f}  Area = {:>12.2f}  {:>5.2f} %\n", delay, area, area_gain ) );
+    }
+    else
+    {
+      st.round_stats.push_back(
+          fmt::format( "[i] Delay    : Delay = {:>12.2f}  Area = {:>12.2f}  {:>5.2f} %\n", delay, area, area_gain ) );
+    }
+  }
+
+  void compute_exact_area() /* one exact-area round: re-matches every gate with reference counting, then refreshes area and delay */
+  {
+    for ( auto const& n : top_order )
+    {
+      if ( ntk.is_constant( n ) || ntk.is_pi( n ) )
+        continue;
+
+      auto index = ntk.node_to_index( n );
+      auto& node_data = node_match[index];
+
+      /* recursively deselect the best cut shared between
+       * the two phases if in use in the cover */
+      if ( node_data.same_match && node_data.map_refs[2] != 0 )
+      {
+        if ( node_data.best_supergate[0] != nullptr )
+          cut_deref( cuts.cuts( index )[node_data.best_cut[0]], n, 0u );
+        else
+          cut_deref( cuts.cuts( index )[node_data.best_cut[1]], n, 1u );
+      }
+
+      /* match positive phase */
+      match_phase_exact( n, 0u );
+
+      /* match negative phase */
+      match_phase_exact( n, 1u );
+
+      /* try to drop one phase (this also re-references the cut that is kept) */
+      match_drop_phase<true, true>( n, 0u );
+    }
+
+    double area_old = area;
+    set_mapping_refs<true>(); /* ELA mode: the reference counters are kept, area and delay are recomputed */
+
+    /* round stats */
+    if ( ps.verbose )
+    {
+      float area_gain = float( ( area_old - area ) / area_old * 100 ); /* relative area change w.r.t. the previous round, in percent */
+      std::stringstream stats{};
+      stats << fmt::format( "[i] Area     : Delay = {:>12.2f}  Area = {:>12.2f}  {:>5.2f} %\n", delay, area, area_gain );
+      st.round_stats.push_back( stats.str() );
+    }
+  }
+
+  void finalize_cover( NtkDest& res, node_map<signal<NtkDest>, Ntk>& old2new )
+  {
+    /* Builds the mapped network `res` from the selected cover. `old2new` maps source
+     * nodes to signals of `res` and is extended with one entry per implemented gate. */
+    auto const& db = library.get_database();
+
+    /* walk the cached topological order, so that the leaves of a cut are always mapped
+     * before the cut root, even when node indices are not topologically sorted */
+    for ( auto const& n : top_order )
+    {
+      if ( ntk.is_constant( n ) || ntk.is_pi( n ) )
+        continue;
+      auto index = ntk.node_to_index( n );
+      if ( node_match[index].map_refs[2] == 0u )
+        continue; /* node is not part of the cover */
+
+      /* get the implemented phase and map the best cut */
+      unsigned phase = ( node_match[index].best_supergate[0] != nullptr ) ? 0 : 1;
+      auto& best_cut = cuts.cuts( index )[node_match[index].best_cut[phase]];
+
+      std::vector<signal<NtkDest>> children( NInputs, res.get_constant( false ) );
+      auto const& match = matches[index][best_cut->data.match_index];
+      auto const& supergate = node_match[index].best_supergate[phase];
+      auto ctr = 0u;
+      for ( auto l : best_cut )
+        children[match.permutation[ctr++]] = old2new[ntk.index_to_node( l )]; /* leaf goes to its pin of the NPN representative */
+      for ( auto i = 0u; i < NInputs; ++i )
+      {
+        if ( ( match.negation >> i ) & 1 )
+          children[i] = !children[i];
+      }
+      topo_view topo{ db, supergate->root };
+      auto f = cleanup_dangling( topo, res, children.begin(), children.end() ).front();
+
+      if ( phase == 1 )
+        f = !f; /* the gate implements the negative phase: store the positive one */
+
+      old2new[n] = f;
+    }
+
+    /* create POs */
+    ntk.foreach_po( [&]( auto const& f ) {
+      res.create_po( ntk.is_complemented( f ) ? res.create_not( old2new[f] ) : old2new[f] );
+    } );
+
+    /* write final results */
+    st.area = area;
+    st.delay = delay;
+  }
+
+  template<bool ELA> /* ELA = true keeps the reference counters as they are and only recomputes delay, area and estimates */
+  void set_mapping_refs()
+  {
+    const auto coef = 1.0f / ( 2.0f + ( iteration + 1 ) * ( iteration + 1 ) ); /* weight of the old estimate in the blend below; shrinks as rounds progress */
+
+    if constexpr ( !ELA )
+    {
+      for ( auto i = 0u; i < node_match.size(); ++i )
+      {
+        node_match[i].map_refs[0] = node_match[i].map_refs[1] = node_match[i].map_refs[2] = 0u;
+      }
+    }
+
+    /* compute current delay and update mapping refs */
+    delay = 0.0f;
+    ntk.foreach_po( [this]( auto s ) {
+      const auto index = ntk.node_to_index( ntk.get_node( s ) );
+      if ( ntk.is_complemented( s ) )
+        delay = std::max( delay, node_match[index].arrival[1] );
+      else
+        delay = std::max( delay, node_match[index].arrival[0] );
+
+      if constexpr ( !ELA )
+      {
+        node_match[index].map_refs[2]++; /* index 2 counts the uses in any phase */
+        if ( ntk.is_complemented( s ) )
+          node_match[index].map_refs[1]++;
+        else
+          node_match[index].map_refs[0]++;
+      }
+    } );
+
+    /* compute current area and update mapping refs in top-down order */
+    area = 0.0f;
+    for ( auto it = top_order.rbegin(); it != top_order.rend(); ++it )
+    {
+      const auto index = ntk.node_to_index( *it );
+      /* PIs only pay for an inverter when used negated; constants cost nothing */
+      if ( ntk.is_pi( *it ) )
+      {
+        if ( node_match[index].map_refs[1] > 0u )
+        {
+          /* Add inverter over the negated fanins */
+          area += lib_inv_area;
+        }
+        continue;
+      }
+      else if ( ntk.is_constant( *it ) )
+      {
+        continue;
+      }
+
+      if ( node_match[index].map_refs[2] == 0u )
+        continue;
+
+      auto& node_data = node_match[index];
+      unsigned use_phase = node_data.best_supergate[0] == nullptr ? 1u : 0u; /* phase owning a supergate (phase 0 when both do) */
+
+      if ( node_data.same_match || node_data.map_refs[use_phase] > 0 )
+      {
+        if constexpr ( !ELA )
+        {
+          auto const& best_cut = cuts.cuts( index )[node_data.best_cut[use_phase]];
+          auto const& match = matches[index][best_cut->data.match_index];
+          auto ctr = 0u;
+          for ( auto const leaf : best_cut )
+          {
+            node_match[leaf].map_refs[2]++;
+            if ( ( node_data.phase[use_phase] >> match.permutation[ctr++] ) & 1 )
+              node_match[leaf].map_refs[1]++;
+            else
+              node_match[leaf].map_refs[0]++;
+          }
+        }
+        area += node_data.area[use_phase];
+        if ( node_data.same_match && node_data.map_refs[use_phase ^ 1] > 0 )
+        {
+          area += lib_inv_area; /* the other phase is obtained with an output inverter */
+        }
+      }
+
+      /* invert the phase */
+      use_phase = use_phase ^ 1;
+
+      /* if both phases are implemented and used */
+      if ( !node_data.same_match && node_data.map_refs[use_phase] > 0 )
+      {
+        if constexpr ( !ELA )
+        {
+          auto const& best_cut = cuts.cuts( index )[node_data.best_cut[use_phase]];
+          auto const& match = matches[index][best_cut->data.match_index];
+          auto ctr = 0u;
+          for ( auto const leaf : best_cut )
+          {
+            node_match[leaf].map_refs[2]++;
+            if ( ( node_data.phase[use_phase] >> match.permutation[ctr++] ) & 1 )
+              node_match[leaf].map_refs[1]++;
+            else
+              node_match[leaf].map_refs[0]++;
+          }
+        }
+        area += node_data.area[use_phase];
+      }
+    }
+
+    /* blend the estimated references with the actual ones (clamped to at least 1) */
+    for ( auto i = 0u; i < ntk.size(); ++i )
+    {
+      node_match[i].est_refs[2] = coef * node_match[i].est_refs[2] + ( 1.0f - coef ) * std::max( 1.0f, static_cast<float>( node_match[i].map_refs[2] ) );
+      node_match[i].est_refs[1] = coef * node_match[i].est_refs[1] + ( 1.0f - coef ) * std::max( 1.0f, static_cast<float>( node_match[i].map_refs[1] ) );
+      node_match[i].est_refs[0] = coef * node_match[i].est_refs[0] + ( 1.0f - coef ) * std::max( 1.0f, static_cast<float>( node_match[i].map_refs[0] ) );
+    }
+
+    ++iteration; /* every call closes one mapping round */
+  }
+
+  void compute_required_time()
+  {
+    /* Recomputes the required times of both phases of every node from the current cover:
+     * POs get the target time, which is then pushed backwards through the selected cuts. */
+    for ( auto& entry : node_match )
+      entry.required[0] = entry.required[1] = std::numeric_limits<float>::max();
+
+    /* return in case of `skip_delay_round`: no cover has been computed yet */
+    if ( iteration == 0 )
+      return;
+
+    auto required = delay;
+
+    if ( ps.required_time != 0.0f )
+    {
+      /* Global target time constraint */
+      if ( ps.required_time < delay - epsilon )
+      {
+        if ( !ps.skip_delay_round && iteration == 1 )
+          std::cerr << fmt::format( "[i] MAP WARNING: cannot meet the target required time of {:.2f}", ps.required_time ) << std::endl;
+      }
+      else
+      {
+        required = ps.required_time;
+      }
+    }
+
+    /* set the required time at POs */
+    ntk.foreach_po( [&]( auto const& s ) {
+      const auto index = ntk.node_to_index( ntk.get_node( s ) );
+      if ( ntk.is_complemented( s ) )
+        node_match[index].required[1] = required;
+      else
+        node_match[index].required[0] = required;
+    } );
+
+    /* propagate required time to the PIs in reverse topological order */
+    for ( auto it = top_order.rbegin(); it != top_order.rend(); ++it )
+    {
+      /* terminals are skipped, not used as a stop mark: they may be interleaved with gates */
+      if ( ntk.is_pi( *it ) || ntk.is_constant( *it ) )
+        continue;
+      const auto i = ntk.node_to_index( *it );
+
+      if ( node_match[i].map_refs[2] == 0 )
+        continue;
+
+      auto& node_data = node_match[i];
+
+      unsigned use_phase = node_data.best_supergate[0] == nullptr ? 1u : 0u;
+      unsigned other_phase = use_phase ^ 1;
+
+      assert( node_data.best_supergate[0] != nullptr || node_data.best_supergate[1] != nullptr );
+      assert( node_data.map_refs[0] || node_data.map_refs[1] );
+
+      /* propagate required time over output inverter if present */
+      if ( node_data.same_match && node_data.map_refs[other_phase] > 0 )
+      {
+        node_data.required[use_phase] = std::min( node_data.required[use_phase], node_data.required[other_phase] - lib_inv_delay );
+      }
+
+      if ( node_data.same_match || node_data.map_refs[use_phase] > 0 )
+      {
+        auto ctr = 0u;
+        auto const& best_cut = cuts.cuts( i )[node_data.best_cut[use_phase]];
+        auto const& match = matches[i][best_cut->data.match_index];
+        auto const& supergate = node_data.best_supergate[use_phase];
+        for ( auto leaf : best_cut )
+        {
+          auto phase = ( node_data.phase[use_phase] >> match.permutation[ctr] ) & 1;
+          node_match[leaf].required[phase] = std::min( node_match[leaf].required[phase], node_data.required[use_phase] - supergate->tdelay[match.permutation[ctr]] );
+          ctr++;
+        }
+      }
+
+      if ( !node_data.same_match && node_data.map_refs[other_phase] > 0 )
+      {
+        auto ctr = 0u;
+        auto const& best_cut = cuts.cuts( i )[node_data.best_cut[other_phase]];
+        auto const& match = matches[i][best_cut->data.match_index];
+        auto const& supergate = node_data.best_supergate[other_phase];
+        for ( auto leaf : best_cut )
+        {
+          auto phase = ( node_data.phase[other_phase] >> match.permutation[ctr] ) & 1;
+          node_match[leaf].required[phase] = std::min( node_match[leaf].required[phase], node_data.required[other_phase] - supergate->tdelay[match.permutation[ctr]] );
+          ctr++;
+        }
+      }
+    }
+  }
+
+  template<bool DO_AREA> /* DO_AREA = true compares area flow first and enforces the required time; false compares arrival first */
+  void match_phase( node<Ntk> const& n, uint8_t phase )
+  {
+    float best_arrival = std::numeric_limits<float>::max();
+    float best_area_flow = std::numeric_limits<float>::max();
+    float best_area = std::numeric_limits<float>::max();
+    uint32_t best_size = UINT32_MAX;
+    uint8_t best_cut = 0u;
+    uint8_t best_phase = 0u;
+    uint8_t cut_index = 0u;
+    auto index = ntk.node_to_index( n );
+
+    auto& node_data = node_match[index];
+    auto& cut_matches = matches[index];
+    exact_supergate<NtkDest, NInputs> const* best_supergate = node_data.best_supergate[phase];
+
+    /* recompute best match info: the match kept so far is re-evaluated with the current leaf data */
+    if ( best_supergate != nullptr )
+    {
+      auto const& cut = cuts.cuts( index )[node_data.best_cut[phase]];
+      auto& supergates = cut_matches[( cut )->data.match_index];
+
+      /* permute the children to the NPN-representative configuration */
+      std::vector<uint32_t> children( NInputs, 0u );
+      auto ctr = 0u;
+      for ( auto l : cut )
+      {
+        children[supergates.permutation[ctr++]] = l;
+      }
+
+      best_phase = node_data.phase[phase];
+      best_arrival = 0.0f;
+      best_area_flow = best_supergate->area + cut_leaves_flow( cut, n, phase );
+      best_area = best_supergate->area;
+      best_cut = node_data.best_cut[phase];
+      best_size = cut.size();
+      for ( auto pin = 0u; pin < NInputs; pin++ )
+      {
+        float arrival_pin = node_match[children[pin]].arrival[( best_phase >> pin ) & 1] + best_supergate->tdelay[pin];
+        best_arrival = std::max( best_arrival, arrival_pin );
+      }
+    }
+
+    /* foreach cut */
+    for ( auto& cut : cuts.cuts( index ) )
+    {
+      /* trivial cuts or not matched cuts */
+      if ( ( *cut )->data.ignore )
+      {
+        ++cut_index;
+        continue;
+      }
+
+      auto const& supergates = cut_matches[( *cut )->data.match_index];
+
+      if ( supergates.supergates[phase] == nullptr )
+      {
+        ++cut_index;
+        continue;
+      }
+
+      /* permute the children to the NPN-representative configuration */
+      std::vector<uint32_t> children( NInputs, 0u );
+      auto ctr = 0u;
+      for ( auto l : *cut )
+      {
+        children[supergates.permutation[ctr++]] = l;
+      }
+
+      /* match each gate and take the best one */
+      for ( auto const& gate : *supergates.supergates[phase] )
+      {
+        uint8_t complement = supergates.negation;
+        node_data.phase[phase] = complement; /* cut_leaves_flow reads the leaf polarities from node_data.phase */
+        float area_local = gate.area + cut_leaves_flow( *cut, n, phase );
+        float worst_arrival = 0.0f;
+        for ( auto pin = 0u; pin < NInputs; pin++ )
+        {
+          float arrival_pin = node_match[children[pin]].arrival[( complement >> pin ) & 1] + gate.tdelay[pin];
+          worst_arrival = std::max( worst_arrival, arrival_pin );
+        }
+
+        if constexpr ( DO_AREA )
+        {
+          if ( worst_arrival > node_data.required[phase] + epsilon )
+            continue; /* the gate would violate the required time */
+        }
+
+        if ( compare_map<DO_AREA>( worst_arrival, best_arrival, area_local, best_area_flow, cut->size(), best_size ) )
+        {
+          best_arrival = worst_arrival;
+          best_area_flow = area_local;
+          best_size = cut->size();
+          best_cut = cut_index;
+          best_area = gate.area;
+          best_phase = complement;
+          best_supergate = &gate;
+        }
+      }
+
+      ++cut_index;
+    }
+
+    /* commit the winner (this also restores node_data.phase, which was used as scratch above) */
+    node_data.flows[phase] = best_area_flow;
+    node_data.arrival[phase] = best_arrival;
+    node_data.area[phase] = best_area;
+    node_data.best_cut[phase] = best_cut;
+    node_data.phase[phase] = best_phase;
+    node_data.best_supergate[phase] = best_supergate;
+  }
+
+  void match_phase_exact( node<Ntk> const& n, uint8_t phase ) /* picks the best match of `phase` using exact area measured by referencing/dereferencing cuts */
+  {
+    float best_arrival = std::numeric_limits<float>::max();
+    float best_exact_area = std::numeric_limits<float>::max();
+    float best_area = std::numeric_limits<float>::max();
+    uint32_t best_size = UINT32_MAX;
+    uint8_t best_cut = 0u;
+    uint8_t best_phase = 0u;
+    uint8_t cut_index = 0u;
+    auto index = ntk.node_to_index( n );
+
+    auto& node_data = node_match[index];
+    auto& cut_matches = matches[index];
+    exact_supergate<NtkDest, NInputs> const* best_supergate = node_data.best_supergate[phase];
+
+    /* recompute best match info: the match kept so far is re-evaluated with the current leaf data */
+    if ( best_supergate != nullptr )
+    {
+      auto const& cut = cuts.cuts( index )[node_data.best_cut[phase]];
+      auto const& supergates = cut_matches[( cut )->data.match_index];
+
+      /* permute the children to the NPN-representative configuration */
+      std::vector<uint32_t> children( NInputs, 0u );
+      auto ctr = 0u;
+      for ( auto l : cut )
+      {
+        children[supergates.permutation[ctr++]] = l;
+      }
+
+      best_phase = supergates.negation;
+      best_arrival = 0.0f;
+      best_area = best_supergate->area;
+      best_cut = node_data.best_cut[phase];
+      best_size = cut.size();
+      for ( auto pin = 0u; pin < NInputs; pin++ )
+      {
+        float arrival_pin = node_match[children[pin]].arrival[( best_phase >> pin ) & 1] + best_supergate->tdelay[pin];
+        best_arrival = std::max( best_arrival, arrival_pin );
+      }
+
+      /* if cut is implemented, remove it from the cover */
+      if ( !node_data.same_match && node_data.map_refs[phase] )
+      {
+        best_exact_area = cut_deref( cuts.cuts( index )[best_cut], n, phase );
+      }
+      else
+      {
+        best_exact_area = cut_ref( cuts.cuts( index )[best_cut], n, phase ); /* otherwise measure it with a temporary reference ... */
+        cut_deref( cuts.cuts( index )[best_cut], n, phase );                 /* ... that is undone right away */
+      }
+    }
+
+    /* foreach cut */
+    for ( auto& cut : cuts.cuts( index ) )
+    {
+      /* trivial cuts or not matched cuts */
+      if ( ( *cut )->data.ignore )
+      {
+        ++cut_index;
+        continue;
+      }
+
+      auto const& supergates = cut_matches[( *cut )->data.match_index];
+
+      if ( supergates.supergates[phase] == nullptr )
+      {
+        ++cut_index;
+        continue;
+      }
+
+      /* permute the children to the NPN-representative configuration */
+      std::vector<uint32_t> children( NInputs, 0u );
+      auto ctr = 0u;
+      for ( auto l : *cut )
+      {
+        children[supergates.permutation[ctr++]] = l;
+      }
+
+      for ( auto const& gate : *supergates.supergates[phase] )
+      {
+        uint8_t complement = supergates.negation;
+        node_data.phase[phase] = complement; /* cut_ref/cut_deref read the leaf polarities from node_data.phase ... */
+        node_data.area[phase] = gate.area;   /* ... and the gate area from node_data.area */
+        auto area_exact = cut_ref( *cut, n, phase );
+        cut_deref( *cut, n, phase ); /* undo the trial reference */
+        float worst_arrival = 0.0f;
+        for ( auto pin = 0u; pin < NInputs; pin++ )
+        {
+          float arrival_pin = node_match[children[pin]].arrival[( complement >> pin ) & 1] + gate.tdelay[pin];
+          worst_arrival = std::max( worst_arrival, arrival_pin );
+        }
+
+        if ( worst_arrival > node_data.required[phase] + epsilon )
+          continue; /* the gate would violate the required time */
+
+        if ( compare_map<true>( worst_arrival, best_arrival, area_exact, best_exact_area, cut->size(), best_size ) )
+        {
+          best_arrival = worst_arrival;
+          best_exact_area = area_exact;
+          best_area = gate.area;
+          best_size = cut->size();
+          best_cut = cut_index;
+          best_phase = complement;
+          best_supergate = &gate;
+        }
+      }
+
+      ++cut_index;
+    }
+
+    /* commit the winner (this also restores the fields used as scratch in the loop above) */
+    node_data.flows[phase] = best_exact_area;
+    node_data.arrival[phase] = best_arrival;
+    node_data.area[phase] = best_area;
+    node_data.best_cut[phase] = best_cut;
+    node_data.phase[phase] = best_phase;
+    node_data.best_supergate[phase] = best_supergate;
+
+    if ( !node_data.same_match && node_data.map_refs[phase] )
+    {
+      best_exact_area = cut_ref( cuts.cuts( index )[best_cut], n, phase ); /* put the chosen cut back in the cover; NOTE(review): the assigned value is not read afterwards */
+    }
+  }
+
+  template<bool DO_AREA, bool ELA>
+  void match_drop_phase( node<Ntk> const& n, unsigned area_margin_factor )
+  {
+    /* Tries to implement both output phases of `n` with a single match plus an inverter.
+     * DO_AREA selects the criterion (required time instead of arrival comparison); with ELA
+     * the reference counters of the cover are kept consistent with the decision taken. */
+    auto index = ntk.node_to_index( n );
+    auto& node_data = node_match[index];
+
+    /* compute arrival adding an inverter to the other match phase */
+    float worst_arrival_npos = node_data.arrival[1] + lib_inv_delay;
+    float worst_arrival_nneg = node_data.arrival[0] + lib_inv_delay;
+    bool use_zero = false;
+    bool use_one = false;
+
+    /* only one phase is matched */
+    if ( node_data.best_supergate[0] == nullptr )
+    {
+      set_match_complemented_phase( index, 1, worst_arrival_npos );
+      if constexpr ( ELA )
+      {
+        if ( node_data.map_refs[2] )
+          cut_ref( cuts.cuts( index )[node_data.best_cut[1]], n, 1 );
+      }
+      return;
+    }
+    else if ( node_data.best_supergate[1] == nullptr )
+    {
+      set_match_complemented_phase( index, 0, worst_arrival_nneg );
+      if constexpr ( ELA )
+      {
+        if ( node_data.map_refs[2] )
+          cut_ref( cuts.cuts( index )[node_data.best_cut[0]], n, 0 );
+      }
+      return;
+    }
+
+    /* try to use only one match to cover both phases */
+    if constexpr ( !DO_AREA )
+    {
+      /* if arrival is less matching the other phase and inserting an inverter */
+      if ( worst_arrival_npos < node_data.arrival[0] + epsilon )
+        use_one = true;
+      if ( worst_arrival_nneg < node_data.arrival[1] + epsilon )
+        use_zero = true;
+      if ( !use_zero && !use_one )
+      {
+        /* use both phases to improve delay */
+        node_data.flows[2] = ( node_data.flows[0] + node_data.flows[1] ) / node_data.est_refs[2];
+        node_data.flows[0] = node_data.flows[0] / node_data.est_refs[0];
+        node_data.flows[1] = node_data.flows[1] / node_data.est_refs[1];
+        return;
+      }
+    }
+    else
+    {
+      /* check if both phases + inverter meet the required time */
+      use_zero = worst_arrival_nneg < node_data.required[1] + epsilon - area_margin_factor * lib_inv_delay;
+      use_one = worst_arrival_npos < node_data.required[0] + epsilon - area_margin_factor * lib_inv_delay;
+    }
+
+    /* use area flow as a tiebreaker. Unfortunately cannot keep
+     * the both phases since `node_map` does not support that */
+    if ( use_zero && use_one )
+    {
+      auto size_zero = cuts.cuts( index )[node_data.best_cut[0]].size();
+      auto size_one = cuts.cuts( index )[node_data.best_cut[1]].size();
+      if ( compare_map<DO_AREA>( worst_arrival_nneg, worst_arrival_npos, node_data.flows[0], node_data.flows[1], size_zero, size_one ) )
+        use_one = false;
+      else
+        use_zero = false;
+    }
+
+    if ( use_zero )
+    {
+      if constexpr ( ELA )
+      {
+        if ( !node_data.same_match )
+        {
+          if ( node_data.map_refs[1] > 0 )
+            cut_deref( cuts.cuts( index )[node_data.best_cut[1]], n, 1 );
+          /* reference the positive cut only when the node is used in the cover at all */
+          if ( node_data.map_refs[0] == 0 && node_data.map_refs[2] )
+            cut_ref( cuts.cuts( index )[node_data.best_cut[0]], n, 0 );
+        }
+        else if ( node_data.map_refs[2] )
+          cut_ref( cuts.cuts( index )[node_data.best_cut[0]], n, 0 );
+      }
+      set_match_complemented_phase( index, 0, worst_arrival_nneg );
+    }
+    else
+    {
+      if constexpr ( ELA )
+      {
+        if ( !node_data.same_match )
+        {
+          if ( node_data.map_refs[0] > 0 )
+            cut_deref( cuts.cuts( index )[node_data.best_cut[0]], n, 0 );
+          if ( node_data.map_refs[1] == 0 && node_data.map_refs[2] )
+            cut_ref( cuts.cuts( index )[node_data.best_cut[1]], n, 1 );
+        }
+        else if ( node_data.map_refs[2] )
+          cut_ref( cuts.cuts( index )[node_data.best_cut[1]], n, 1 );
+      }
+      set_match_complemented_phase( index, 1, worst_arrival_npos );
+    }
+  }
+
+  inline void set_match_complemented_phase( uint32_t index, uint8_t phase, float worst_arrival_n )
+  {
+    /* `phase` keeps its match; the opposite phase reuses it and loses its own supergate */
+    auto& entry = node_match[index];
+    auto opposite = phase ^ 1;
+    const auto shared_flow = entry.flows[phase] / entry.est_refs[2];
+    entry.flows[2] = entry.flows[opposite] = entry.flows[phase] = shared_flow;
+    entry.area[opposite] = entry.area[phase];
+    entry.arrival[opposite] = worst_arrival_n;
+    entry.phase[opposite] = entry.phase[phase] ^ ( 1 << NInputs ); /* same leaf polarities, bit NInputs flipped */
+    entry.best_cut[opposite] = entry.best_cut[phase];
+    entry.best_supergate[opposite] = nullptr;
+    entry.same_match = true;
+  }
+
+  inline float cut_leaves_flow( cut_t const& cut, node<Ntk> const& n, uint8_t phase )
+  {
+    /* sums the flow of the cut leaves, each one taken in the polarity the match asks for */
+    const auto root = ntk.node_to_index( n );
+    auto const& pin_map = matches[root][cut->data.match_index].permutation;
+    const auto polarity = node_match[root].phase[phase];
+    float total = 0.0f;
+    uint8_t pos = 0u;
+    for ( auto leaf : cut )
+    {
+      total += node_match[leaf].flows[( polarity >> pin_map[pos] ) & 1];
+      ++pos;
+    }
+    return total;
+  }
+
+  float cut_ref( cut_t const& cut, node<Ntk> const& n, uint8_t phase ) /* references the leaves of `cut` recursively; returns the area this adds (gate area included) */
+  {
+    auto const& node_data = node_match[ntk.node_to_index( n )];
+    auto const& match = matches[ntk.node_to_index( n )][cut->data.match_index];
+    float count = node_data.area[phase]; /* starts from the area stored for the node in this phase */
+    uint8_t ctr = 0;
+    for ( auto leaf : cut )
+    {
+      /* compute leaf phase using the current gate */
+      uint8_t leaf_phase = ( node_data.phase[phase] >> match.permutation[ctr] ) & 1;
+
+      if ( ntk.is_constant( ntk.index_to_node( leaf ) ) )
+      {
+        ++ctr; /* constants are neither counted nor charged */
+        continue;
+      }
+      else if ( ntk.is_pi( ntk.index_to_node( leaf ) ) )
+      {
+        /* reference PIs, add inverter cost for negative phase */
+        if ( leaf_phase == 1u )
+        {
+          if ( node_match[leaf].map_refs[1]++ == 0u )
+            count += lib_inv_area; /* first negated use of this PI */
+        }
+        else
+        {
+          ++node_match[leaf].map_refs[0];
+        }
+        ++ctr;
+        continue;
+      }
+
+      if ( node_match[leaf].same_match )
+      {
+        /* Add inverter area if not present yet and leaf node is implemented in the opposite phase */
+        if ( node_match[leaf].map_refs[leaf_phase]++ == 0u && node_match[leaf].best_supergate[leaf_phase] == nullptr )
+          count += lib_inv_area;
+        /* Recursive referencing if leaf was not referenced */
+        if ( node_match[leaf].map_refs[2]++ == 0u )
+        {
+          count += cut_ref( cuts.cuts( leaf )[node_match[leaf].best_cut[leaf_phase]], ntk.index_to_node( leaf ), leaf_phase );
+        }
+      }
+      else
+      {
+        /* the two phases of the leaf have separate matches: recurse on the first use of this phase */
+        ++node_match[leaf].map_refs[2];
+        if ( node_match[leaf].map_refs[leaf_phase]++ == 0u )
+        {
+          count += cut_ref( cuts.cuts( leaf )[node_match[leaf].best_cut[leaf_phase]], ntk.index_to_node( leaf ), leaf_phase );
+        }
+      }
+      ++ctr;
+    }
+    return count;
+  }
+
+  float cut_deref( cut_t const& cut, node<Ntk> const& n, uint8_t phase ) /* dereferences the leaves of `cut` recursively; returns the area this frees (gate area included) */
+  {
+    auto const& node_data = node_match[ntk.node_to_index( n )];
+    auto const& match = matches[ntk.node_to_index( n )][cut->data.match_index];
+    float count = node_data.area[phase]; /* starts from the area stored for the node in this phase */
+    uint8_t ctr = 0;
+    for ( auto leaf : cut )
+    {
+      /* compute leaf phase using the current gate */
+      uint8_t leaf_phase = ( node_data.phase[phase] >> match.permutation[ctr] ) & 1;
+
+      if ( ntk.is_constant( ntk.index_to_node( leaf ) ) )
+      {
+        ++ctr; /* constants are neither counted nor charged */
+        continue;
+      }
+      else if ( ntk.is_pi( ntk.index_to_node( leaf ) ) )
+      {
+        /* dereference PIs, add inverter cost for negative phase */
+        if ( leaf_phase == 1u )
+        {
+          if ( --node_match[leaf].map_refs[1] == 0u )
+            count += lib_inv_area; /* last negated use of this PI */
+        }
+        else
+        {
+          --node_match[leaf].map_refs[0];
+        }
+        ++ctr;
+        continue;
+      }
+
+      if ( node_match[leaf].same_match )
+      {
+        /* Add inverter area if it is used only by the current gate and leaf node is implemented in the opposite phase */
+        if ( --node_match[leaf].map_refs[leaf_phase] == 0u && node_match[leaf].best_supergate[leaf_phase] == nullptr )
+          count += lib_inv_area;
+        /* Recursive dereferencing */
+        if ( --node_match[leaf].map_refs[2] == 0u )
+        {
+          count += cut_deref( cuts.cuts( leaf )[node_match[leaf].best_cut[leaf_phase]], ntk.index_to_node( leaf ), leaf_phase );
+        }
+      }
+      else
+      {
+        /* the two phases of the leaf have separate matches: recurse on the last use of this phase */
+        --node_match[leaf].map_refs[2];
+        if ( --node_match[leaf].map_refs[leaf_phase] == 0u )
+        {
+          count += cut_deref( cuts.cuts( leaf )[node_match[leaf].best_cut[leaf_phase]], ntk.index_to_node( leaf ), leaf_phase );
+        }
+      }
+      ++ctr;
+    }
+    return count;
+  }
+
+  template<bool DO_AREA>
+  inline bool compare_map( float arrival, float best_arrival, float area_flow, float best_area_flow, uint32_t size, uint32_t best_size )
+  {
+    /* Tells whether a candidate match is better than the incumbent one.
+     * The comparison is lexicographic: the primary key is the area flow
+     * when DO_AREA is set and the arrival time otherwise, the remaining
+     * quantity is the secondary key, and the cut size is the last resort.
+     * Key values closer than `epsilon` are treated as ties. */
+
+    float primary = arrival;
+    float best_primary = best_arrival;
+    float secondary = area_flow;
+    float best_secondary = best_area_flow;
+
+    /* in area mode the two keys swap their roles */
+    if constexpr ( DO_AREA )
+    {
+      primary = area_flow;
+      best_primary = best_area_flow;
+      secondary = arrival;
+      best_secondary = best_arrival;
+    }
+
+    /* primary key */
+    if ( primary < best_primary - epsilon )
+    {
+      return true;
+    }
+    if ( primary > best_primary + epsilon )
+    {
+      return false;
+    }
+
+    /* secondary key */
+    if ( secondary < best_secondary - epsilon )
+    {
+      return true;
+    }
+    if ( secondary > best_secondary + epsilon )
+    {
+      return false;
+    }
+
+    /* both keys tie within the tolerance: the smaller cut wins */
+    const bool smaller_cut = size < best_size;
+    return smaller_cut;
+  }
+
+private:
+  Ntk& ntk;                                                    /* network being mapped */
+  exact_library<NtkDest, RewritingFn, NInputs> const& library; /* source of the supergates, the database and the inverter data */
+  map_params const& ps;
+  map_stats& st;
+
+  uint32_t iteration{ 0 };       /* number of completed mapping rounds (advanced by set_mapping_refs) */
+  double delay{ 0.0f };          /* current delay of the mapping */
+  double area{ 0.0f };           /* current area of the mapping */
+  const float epsilon{ 0.005f }; /* tolerance used when comparing delays and areas */
+
+  /* lib inverter info */
+  float lib_inv_area;
+  float lib_inv_delay;
+
+  std::vector<node<Ntk>> top_order;                                                 /* nodes in topological order, filled by run() */
+  std::vector<node_match_t<NtkDest, NInputs>> node_match;                           /* per-node mapping data, addressed by node index */
+  std::unordered_map<uint32_t, std::vector<cut_match_t<NtkDest, NInputs>>> matches; /* node index -> matches of its cuts, addressed by the cut's match_index */
+  network_cuts_t cuts;                                                              /* enumerated cuts of the network */
+};
+
+} /* namespace detail */
+
+/*! \brief Exact mapping.
+ *
+ * This function implements a mapping algorithm using an exact synthesis database.
+ * It is controlled by a template argument `CutData` (defaulted to
+ * `cut_enumeration_exact_map_cut`). The argument is similar to the `CutData` argument
+ * in `cut_enumeration`, which can specialize the cost function to select priority
+ * cuts and store additional data. The default argument gives priority firstly to
+ * area flow, then delay, and lastly to the cut size.
+ * The type passed as `CutData` must implement the following four fields:
+ *
+ * - `uint32_t delay`
+ * - `float flow`
+ * - `uint8_t match_index`
+ * - `bool ignore`
+ *
+ * See `include/mockturtle/algorithms/cut_enumeration/cut_enumeration_exact_map_cut.hpp`
+ * for one example of a CutData type that implements the cost function that is used in
+ * the technology mapper.
+ *
+ * The function returns a mapped network representation generated using the exact
+ * synthesis entries in the `exact_library`.
+ *
+ * **Required network functions:**
+ * - `size`
+ * - `is_pi`
+ * - `is_constant`
+ * - `node_to_index`
+ * - `index_to_node`
+ * - `get_node`
+ * - `foreach_po`
+ * - `foreach_node`
+ * - `fanout_size`
+ *
+ * \param ntk Network
+ * \param library Exact library
+ * \param ps Mapping params
+ * \param pst Mapping statistics
+ */
+template<class Ntk, class NtkDest = Ntk, class RewritingFn, unsigned NInputs, typename CutData = cut_enumeration_exact_map_cut>
+NtkDest exact_map( Ntk& ntk, exact_library<NtkDest, RewritingFn, NInputs> const& library, map_params const& ps = {}, map_stats* pst = nullptr )
+{
+  /* compile-time checks of the interface required from the source network */
+  static_assert( is_network_type_v<Ntk>, "Ntk is not a network type" );
+  static_assert( has_size_v<Ntk>, "Ntk does not implement the size method" );
+  static_assert( has_is_pi_v<Ntk>, "Ntk does not implement the is_pi method" );
+  static_assert( has_is_constant_v<Ntk>, "Ntk does not implement the is_constant method" );
+  static_assert( has_node_to_index_v<Ntk>, "Ntk does not implement the node_to_index method" );
+  static_assert( has_index_to_node_v<Ntk>, "Ntk does not implement the index_to_node method" );
+  static_assert( has_get_node_v<Ntk>, "Ntk does not implement the get_node method" );
+  static_assert( has_foreach_po_v<Ntk>, "Ntk does not implement the foreach_po method" );
+  static_assert( has_foreach_node_v<Ntk>, "Ntk does not implement the foreach_node method" );
+  static_assert( has_fanout_size_v<Ntk>, "Ntk does not implement the fanout_size method" );
+
+  /* map with a local statistics object, so that `pst` can stay optional */
+  map_stats stats;
+  detail::exact_map_impl<NtkDest, Ntk, RewritingFn, CutData, NInputs> mapper( ntk, library, ps, stats );
+  auto mapped = mapper.run();
+
+  /* total time is the mapping time plus the cut enumeration time */
+  stats.time_total = stats.time_mapping + stats.cut_enumeration_st.time_total;
+  if ( ps.verbose )
+    stats.report();
+
+  /* hand the statistics back only when the caller asked for them */
+  if ( pst != nullptr )
+    *pst = stats;
+
+  return mapped;
+}
+
+} /* namespace mockturtle */
diff --git a/include/mockturtle/io/genlib_reader.hpp b/include/mockturtle/io/genlib_reader.hpp
index 4cbad5567..9c30153cd 100644
--- a/include/mockturtle/io/genlib_reader.hpp
+++ b/include/mockturtle/io/genlib_reader.hpp
@@ -62,6 +62,7 @@ struct pin
 
 struct gate
 {
+  unsigned int id;
   std::string name;
   std::string expression;
   uint32_t num_vars;
@@ -115,7 +116,8 @@ class genlib_reader : public lorina::genlib_reader
                            p.input_load, p.max_load,
                            p.rise_block_delay, p.rise_fanout_delay, p.fall_block_delay, p.fall_fanout_delay} );
     }
-    gates.emplace_back( gate{name, expression, num_vars, tt, area, pp} );
+    gates.emplace_back( gate{static_cast<unsigned int>( gates.size() ), name,
+                             expression, num_vars, tt, area, pp} );
   }
 
 protected:
diff --git a/include/mockturtle/utils/tech_library.hpp b/include/mockturtle/utils/tech_library.hpp
new file mode 100644
index 000000000..2cab50ffc
--- /dev/null
+++ b/include/mockturtle/utils/tech_library.hpp
@@ -0,0 +1,556 @@
+/* mockturtle: C++ logic network library
+ * Copyright (C) 2018-2021  EPFL
+ *
+ * Permission is hereby granted, free of charge, to any person
+ * obtaining a copy of this software and associated documentation
+ * files (the "Software"), to deal in the Software without
+ * restriction, including without limitation the rights to use,
+ * copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following
+ * conditions:
+ *
+ * The above copyright notice and this permission notice shall be
+ * included in all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+ * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
+ * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+ * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
+ * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
+ * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+ * OTHER DEALINGS IN THE SOFTWARE.
+ */
+
+/*!
+  \file tech_library.hpp
+  \brief Implements utilities to enumerate gates for technology mapping
+
+  \author Alessandro Tempia Calvino
+*/
+
+#pragma once
+
+#include <cassert>
+#include <unordered_map>
+#include <vector>
+
+#include <kitty/constructors.hpp>
+#include <kitty/dynamic_truth_table.hpp>
+#include <kitty/npn.hpp>
+#include <kitty/print.hpp>
+#include <kitty/static_truth_table.hpp>
+
+#include "../io/genlib_reader.hpp"
+
+namespace mockturtle
+{
+
+/*
+std::string const mcnc_library =  "GATE   inv1    1 O=!a;           PIN * INV 1 999 0.9 0.3 0.9 0.3\n"
+                                  "GATE   inv2    2 O=!a;           PIN * INV 2 999 1.0 0.1 1.0 0.1\n"
+                                  "GATE   inv3    3 O=!a;           PIN * INV 3 999 1.1 0.09 1.1 0.09\n"
+                                  "GATE   inv4    4 O=!a;           PIN * INV 4 999 1.2 0.07 1.2 0.07\n"
+                                  "GATE   nand2   2 O=!(ab);        PIN * INV 1 999 1.0 0.2 1.0 0.2\n"
+                                  "GATE   nand3   3 O=!(abc);	      PIN * INV 1 999 1.1 0.3 1.1 0.3\n"
+                                  "GATE   nand4   4 O=!(abcd);      PIN * INV 1 999 1.4 0.4 1.4 0.4\n"
+                                  "GATE   nor2    2 O=!{ab};        PIN * INV 1 999 1.4 0.5 1.4 0.5\n"
+                                  "GATE   nor3    3 O=!{abc};       PIN * INV 1 999 2.4 0.7 2.4 0.7\n"
+                                  "GATE   nor4    4 O=!{abcd};      PIN * INV 1 999 3.8 1.0 3.8 1.0\n"
+                                  "GATE   and2    3 O=(ab);         PIN * NONINV 1 999 1.9 0.3 1.9 0.3\n"
+                                  "GATE   or2     3 O={ab};         PIN * NONINV 1 999 2.4 0.3 2.4 0.3\n"
+                                  "GATE   xor2a   5 O=[ab];         PIN * UNKNOWN 2 999 1.9 0.5 1.9 0.5\n"
+                                  "#GATE  xor2b   5 O=[ab];         PIN * UNKNOWN 2 999 1.9 0.5 1.9 0.5\n"
+                                  "GATE   xnor2a  5 O=![ab];        PIN * UNKNOWN 2 999 2.1 0.5 2.1 0.5\n"
+                                  "#GATE  xnor2b  5 O=![ab];        PIN * UNKNOWN 2 999 2.1 0.5 2.1 0.5\n"
+                                  "GATE   aoi21   3 O=!{(ab)c};     PIN * INV 1 999 1.6 0.4 1.6 0.4\n"
+                                  "GATE   aoi22   4 O=!{(ab)(cd)};  PIN * INV 1 999 2.0 0.4 2.0 0.4\n"
+                                  "GATE   oai21   3 O=!({ab}c);     PIN * INV 1 999 1.6 0.4 1.6 0.4\n"
+                                  "GATE   oai22   4 O=!({ab}{cd});  PIN * INV 1 999 2.0 0.4 2.0 0.4\n"
+                                  "GATE   buf     2 O=a;            PIN * NONINV 1 999 1.0 0.0 1.0 0.0\n"
+                                  "GATE   zero    0 O=0;\n"
+                                  "GATE   one     0 O=1;";
+*/
+
+struct tech_library_params
+{
+  /*! \brief Print, for every gate, the number of NP entries added to the library. */
+  bool verbose = false;
+
+  /*! \brief Print every entry of the generated library. */
+  bool very_verbose = false;
+};
+
+template<unsigned NInputs>
+struct supergate
+{
+  struct gate const* root = nullptr; /* library gate this entry was enumerated from */
+
+  /* area of the gate */
+  float area = 0.0f;
+  /* largest pin delay of the gate */
+  float worstDelay = 0.0f;
+  /* delay of each input pin; unused pins stay at zero */
+  std::array<float, NInputs> tdelay = {};
+
+  /* input permutation of this NP configuration */
+  std::vector<uint8_t> permutation;
+
+  /* input negations, one bit per pin */
+  uint8_t polarity = 0;
+};
+
+/*! \brief Library of np-enumerated gates
+ *
+ * This class creates a technology library from a set
+ * of input gates. Each NP-configuration of each gate
+ * is enumerated and inserted in the library.
+ *
+   \verbatim embed:rst
+
+   Example
+
+   .. code-block:: c++
+
+      std::vector<gate> gates;
+      lorina::read_genlib( "file.lib", genlib_reader( gates ) );
+      mockturtle::tech_library lib( gates );
+   \endverbatim
+ */
+template<unsigned NInputs = 5u>
+class tech_library
+{
+  using supergates_list_t = std::vector<supergate<NInputs>>;
+  using tt_hash = kitty::hash<kitty::static_truth_table<NInputs>>;
+  using lib_t = std::unordered_map<kitty::static_truth_table<NInputs>, supergates_list_t, tt_hash>;
+
+public:
+  /*! \brief Copies `gates` and enumerates their NP configurations into the library. */
+  tech_library( std::vector<gate> const& gates, tech_library_params const ps = {} )
+      : _gates( gates ),
+        _ps( ps ),
+        _super_lib()
+  {
+    generate_library();
+  }
+
+  /*! \brief Returns the supergates stored for `tt`, or `nullptr` if there is none. */
+  const supergates_list_t* get_supergates( kitty::static_truth_table<NInputs> const& tt ) const
+  {
+    auto match = _super_lib.find( tt );
+    if ( match != _super_lib.end() )
+      return &match->second;
+    return nullptr;
+  }
+
+  /*! \brief Returns (area, delay, gate id) of the smallest-area inverter found (id is UINT32_MAX if none). */
+  const std::tuple<float, float, uint32_t> get_inverter_info() const
+  {
+    return std::make_tuple( _inv_area, _inv_delay, _inv_id );
+  }
+
+  /*! \brief Returns the largest `num_vars` among the gates accepted into the library. */
+  unsigned max_gate_size() const
+  {
+    return _max_size;
+  }
+
+  /*! \brief Returns a copy of the gates the library was built from. */
+  const std::vector<gate> get_gates() const
+  {
+    return _gates;
+  }
+
+private:
+  /* Fills `_super_lib` with the NP configurations of every gate with at most NInputs variables */
+  void generate_library()
+  {
+    bool inv = false;
+
+    for ( auto& gate : _gates )
+    {
+      if ( gate.function.num_vars() > NInputs )
+      {
+        std::cerr << "[i] WARNING: gate " << gate.name << " IGNORED, too many variables for the library settings" << std::endl;
+        continue;
+      }
+
+      float worst_delay = compute_worst_delay( gate );
+
+      if ( gate.function.num_vars() == 1 )
+      {
+        /* extract inverter delay and area */
+        if ( kitty::is_const0( kitty::cofactor1( gate.function, 0 ) ) )
+        {
+          /* get the smallest area inverter */
+          if ( !inv || gate.area < _inv_area )
+          {
+            _inv_area = gate.area;
+            _inv_delay = worst_delay;
+            _inv_id = gate.id;
+            inv = true;
+          }
+        }
+      }
+
+      _max_size = std::max( _max_size, gate.num_vars );
+
+      uint32_t np_count = 0;
+
+      const auto on_np = [&]( auto const& tt, auto neg, auto const& perm ) {
+        supergate<NInputs> sg;
+        sg.root = &gate;
+        sg.area = gate.area;
+        sg.worstDelay = worst_delay;
+        sg.polarity = 0;
+        sg.permutation = perm;
+
+        for ( auto i = 0u; i < perm.size() && i < NInputs; ++i )
+        {
+          sg.tdelay[i] = worst_delay;                     /* if pin-to-pin delay change to: gate.delay[perm[i]] */
+          sg.polarity |= ( ( neg >> perm[i] ) & 1 ) << i; /* permute input negation to match the right pin */
+        }
+        for ( auto i = perm.size(); i < NInputs; ++i )
+        {
+          sg.tdelay[i] = 0; /* added for completeness but not necessary */
+        }
+
+        const auto static_tt = kitty::extend_to<NInputs>( tt );
+
+        auto& v = _super_lib[static_tt];
+
+        /* ordered insert by ascending area and number of input pins */
+        auto it = std::lower_bound( v.begin(), v.end(), sg, [&]( auto const& s1, auto const& s2 ) {
+          if ( s1.area < s2.area )
+            return true;
+          if ( s1.area > s2.area )
+            return false;
+          if ( s1.root->num_vars < s2.root->num_vars )
+            return true;
+          if ( s1.root->num_vars > s2.root->num_vars )
+            return false; /* must not report "less" here, or the order is not a strict weak ordering */
+          return s1.root->id < s2.root->id;
+        } );
+
+        bool to_add = true;
+        /* entries of the same gate are adjacent: skip the insertion if one with the same polarity
+           and pin delays exists (duplicate due to symmetries), else insert after the last of them */
+        for ( ; it != v.end() && it->root->id == sg.root->id; ++it )
+        {
+          if ( sg.polarity == it->polarity && sg.tdelay == it->tdelay )
+          {
+            to_add = false;
+            break;
+          }
+        }
+
+        if ( to_add )
+        {
+          v.insert( it, sg );
+          ++np_count;
+        }
+
+        /* check correct results */
+        // assert( gate.function == create_from_npn_config( std::make_tuple( tt, neg, sg.permutation ) ) );
+      };
+
+      /* NP enumeration of the function */
+      const auto tt = gate.function;
+      kitty::exact_np_enumeration( tt, on_np );
+
+      if ( _ps.verbose )
+      {
+        std::cout << "Gate " << gate.name << ", num_vars = " << gate.num_vars << ", np entries = " << np_count << std::endl;
+      }
+    }
+
+    if ( !inv )
+    {
+      std::cerr << "[i] WARNING: inverter gate has not been detected in the library" << std::endl;
+    }
+
+    if ( _ps.very_verbose )
+    {
+      for ( auto const& entry : _super_lib )
+      {
+        kitty::print_hex( entry.first );
+        std::cout << ": ";
+        for ( auto const& gate : entry.second )
+        {
+          printf( "%s(d:%.2f, a:%.2f, p:%d) ", gate.root->name.c_str(), gate.worstDelay, gate.area, gate.polarity );
+        }
+        std::cout << std::endl;
+      }
+    }
+  }
+
+  /* Returns the largest rise/fall block delay over all the pins of `g` (0 if it has no pins) */
+  float compute_worst_delay( gate const& g )
+  {
+    float worst_delay = 0.0f;
+
+    /* consider only block_delay */
+    for ( auto const& pin : g.pins )
+    {
+      float worst_pin_delay = static_cast<float>( std::max( pin.rise_block_delay, pin.fall_block_delay ) );
+      worst_delay = std::max( worst_delay, worst_pin_delay );
+    }
+    return worst_delay;
+  }
+
+private:
+  /* inverter info */
+  float _inv_area{ 0.0 };
+  float _inv_delay{ 0.0 };
+  uint32_t _inv_id{ UINT32_MAX };
+
+  unsigned _max_size{ 0 }; /* max #fanins of the gates in the library */
+
+  /* the supergates stored in `_super_lib` point into `_gates` */
+  std::vector<gate> const _gates; /* collection of gates */
+  tech_library_params const _ps;
+  lib_t _super_lib; /* library of enumerated gates */
+};
+
+template<typename Ntk, unsigned NInputs>
+struct exact_supergate
+{
+  signal<Ntk> const root; /* signal the supergate is rooted at */
+
+  /* count of inputs with a non-zero delay */
+  uint8_t n_inputs = 0;
+  /* complementation flags: bit i for input i, bit NInputs for the output */
+  uint8_t polarity = 0;
+
+  /* area of the structure */
+  float area = 0.0f;
+  /* largest input-to-output delay */
+  float worstDelay = 0.0f;
+  /* delay from each input to the output */
+  std::array<float, NInputs> tdelay = { 0.0f };
+
+  exact_supergate( signal<Ntk> const root_signal )
+      : root( root_signal ) {}
+};
+
+struct exact_library_params
+{
+  /* area cost of one gate */
+  float area_gate = 1.0f;
+  /* area cost of one inverter */
+  float area_inverter = 0.0f;
+  /* delay cost of one gate */
+  float delay_gate = 1.0f;
+  /* delay cost of one inverter */
+  float delay_inverter = 0.0f;
+
+  /* classify in NP instead of NPN */
+  bool np_classification = true;
+  /* print the generated library */
+  bool verbose = false;
+};
+
+/*! \brief Library of exact synthesis supergates
+ *
+ * This class creates a technology library from an exact
+ * synthesis database. Each NPN-entry in the database is
+ * stored in its NP class by removing the output inverter
+ * if present. The class creates supergates from the
+ * database computing area and delay information.
+ *
+   \verbatim embed:rst
+
+   Example
+
+   .. code-block:: c++
+
+      mockturtle::mig_npn_resynthesis mig_resyn{true};
+      mockturtle::exact_library<mockturtle::mig_network, mockturtle::mig_npn_resynthesis, 4> lib( mig_resyn );
+   \endverbatim
+ */
+template<typename Ntk, class RewritingFn, unsigned NInputs = 4u>
+class exact_library
+{
+  using supergates_list_t = std::vector<exact_supergate<Ntk, NInputs>>;
+  using tt_hash = kitty::hash<kitty::static_truth_table<NInputs>>;
+  using lib_t = std::unordered_map<kitty::static_truth_table<NInputs>, supergates_list_t, tt_hash>;
+
+public:
+  /*! \brief Builds the library; `rewriting_fn` is called only while constructing, `ps` is copied. */
+  exact_library( RewritingFn const& rewriting_fn, exact_library_params const& ps = {} )
+      : _database(),
+        _rewriting_fn( rewriting_fn ),
+        _ps( ps ),
+        _super_lib()
+  {
+    generate_library();
+  }
+
+  /*! \brief Returns the supergates stored for `tt`, or `nullptr` if there is none. */
+  const supergates_list_t* get_supergates( kitty::static_truth_table<NInputs> const& tt ) const
+  {
+    auto match = _super_lib.find( tt );
+    if ( match != _super_lib.end() )
+      return &match->second;
+    return nullptr;
+  }
+
+  /*! \brief Returns the network in which the structures of the supergates are stored. */
+  const Ntk& get_database() const
+  {
+    return _database;
+  }
+
+  /*! \brief Returns (area, delay) of an inverter as given in the library parameters. */
+  const std::tuple<float, float> get_inverter_info() const
+  {
+    return std::make_tuple( _ps.area_inverter, _ps.delay_inverter );
+  }
+
+private:
+  /* Runs the rewriting function on every NPN class and stores the structures it reports */
+  void generate_library()
+  {
+    std::vector<signal<Ntk>> pis;
+    for ( auto i = 0u; i < NInputs; ++i )
+    {
+      pis.push_back( _database.create_pi() );
+    }
+
+    /* Compute NPN classes */
+    std::unordered_set<kitty::static_truth_table<NInputs>, tt_hash> classes;
+    kitty::static_truth_table<NInputs> tt;
+    do
+    {
+      const auto res = kitty::exact_npn_canonization( tt );
+      classes.insert( std::get<0>( res ) );
+      kitty::next_inplace( tt );
+    } while ( !kitty::is_const0( tt ) );
+
+    /* Construct supergates */
+    for ( auto const& entry : classes )
+    {
+      supergates_list_t supergates_pos;
+      supergates_list_t supergates_neg;
+      auto const not_entry = ~entry;
+
+      const auto add_supergate = [&]( auto const& f_new ) {
+        /* in NP classification a complemented root is stored, without its output
+           inverter, under the complemented function */
+        bool const negated = _ps.np_classification && _database.is_complemented( f_new );
+        auto const f = negated ? !f_new : f_new;
+        exact_supergate<Ntk, NInputs> sg( f );
+        compute_info( sg );
+        ( negated ? supergates_neg : supergates_pos ).push_back( sg );
+        _database.create_po( f );
+        return true;
+      };
+
+      kitty::dynamic_truth_table function = kitty::extend_to( entry, NInputs );
+      _rewriting_fn( _database, function, pis.begin(), pis.end(), add_supergate );
+      if ( supergates_pos.size() > 0 )
+        _super_lib.insert( { entry, supergates_pos } );
+      if ( _ps.np_classification && supergates_neg.size() > 0 )
+        _super_lib.insert( { not_entry, supergates_neg } );
+    }
+
+    if ( _ps.verbose )
+    {
+      std::cout << "Classified in " << _super_lib.size() << " entries" << std::endl;
+      for ( auto const& pair : _super_lib )
+      {
+        kitty::print_hex( pair.first );
+        std::cout << ": ";
+
+        for ( auto const& gate : pair.second )
+        {
+          printf( "%.2f,%.2f,%d,%d,:", gate.worstDelay, gate.area, gate.polarity, gate.n_inputs );
+          for ( auto j = 0u; j < NInputs; ++j )
+            printf( "%.2f/", gate.tdelay[j] );
+          std::cout << " ";
+        }
+        std::cout << std::endl;
+      }
+    }
+  }
+
+  /* Computes delay and area info */
+  void compute_info( exact_supergate<Ntk, NInputs>& sg )
+  {
+    _database.incr_trav_id();
+    /* info does not consider input and output inverters */
+    bool compl_root = _database.is_complemented( sg.root );
+    auto const root = compl_root ? !sg.root : sg.root;
+    sg.area = compute_info_rec( sg, root, 0.0f );
+
+    /* output polarity */
+    sg.polarity |= ( unsigned( compl_root ) ) << NInputs;
+    /* number of inputs */
+    for ( auto i = 0u; i < NInputs; ++i )
+    {
+      sg.tdelay[i] *= -1; /* invert to positive value */
+      if ( sg.tdelay[i] != 0.0f )
+        sg.n_inputs++;
+    }
+    sg.worstDelay *= -1;
+  }
+
+  /* Records in `sg` the (negative) delay and the polarity of every input reached from `root`
+     and returns the area of the gates and inverters that are met for the first time */
+  float compute_info_rec( exact_supergate<Ntk, NInputs>& sg, signal<Ntk> const& root, float delay )
+  {
+    auto n = _database.get_node( root );
+
+    if ( _database.is_constant( n ) )
+      return 0.0f;
+
+    float area = 0.0f;
+    float tdelay = delay;
+
+    if ( _database.is_pi( n ) )
+    {
+      /* pin number = node index - 1 (presumably index 0 is the constant node) */
+      auto const pin = _database.node_to_index( n ) - 1u;
+      sg.tdelay[pin] = std::min( sg.tdelay[pin], tdelay );
+      sg.worstDelay = std::min( sg.worstDelay, tdelay );
+      sg.polarity |= ( unsigned( _database.is_complemented( root ) ) ) << pin;
+      return area;
+    }
+
+    tdelay -= _ps.delay_gate;
+
+    /* add gate area once */
+    if ( _database.visited( n ) != _database.trav_id() )
+    {
+      area += _ps.area_gate;
+      _database.set_value( n, 0u );
+      _database.set_visited( n, _database.trav_id() );
+    }
+
+    if ( _database.is_complemented( root ) )
+    {
+      tdelay -= _ps.delay_inverter;
+      /* add inverter area only once (shared by fanout) */
+      if ( _database.value( n ) == 0u )
+      {
+        area += _ps.area_inverter;
+        _database.set_value( n, 1u );
+      }
+    }
+
+    _database.foreach_fanin( n, [&]( auto const& child ) {
+      area += compute_info_rec( sg, child, tdelay );
+    } );
+
+    return area;
+  }
+
+private:
+  Ntk _database;
+  RewritingFn const& _rewriting_fn; /* only dereferenced while the constructor runs */
+  exact_library_params const _ps; /* own copy: the constructor argument may be a temporary */
+  lib_t _super_lib;
+};
+
+} // namespace mockturtle
diff --git a/lib/kitty/kitty/npn.hpp b/lib/kitty/kitty/npn.hpp
index e3a654e8b..29460ff15 100755
--- a/lib/kitty/kitty/npn.hpp
+++ b/lib/kitty/kitty/npn.hpp
@@ -542,6 +542,89 @@ std::tuple<TT, uint32_t, std::vector<uint8_t>> sifting_p_canonization( const TT&
   return std::make_tuple( npn, phase, perm );
 }
 
+/*! \brief Exact NP enumeration
+
+  Given a truth table, this function enumerates all the functions in its
+  NP class. Two functions are in the same NP class, if one can be obtained
+  from the other by input negation and input permutation.
+
+  The function takes a callback as second parameter which is called for
+  every enumerated function. The callback should take as parameters:
+  - NP-enumerated truth table
+  - input negations
+  - input permutation to apply
+
+  \param tt Truth table
+  \param fn Callback for each enumerated truth table in the NP class
+*/
+template<typename TT, typename Callback>
+void exact_np_enumeration( const TT& tt, Callback&& fn )
+{
+  static_assert( is_complete_truth_table<TT>::value, "Can only be applied on complete truth tables." );
+
+  const auto num_vars = tt.num_vars();
+
+  /* No variables: the function itself is the only entry reported */
+  if ( num_vars == 0 )
+  {
+    fn( tt, 0u, std::vector<uint8_t>{} );
+    return;
+  }
+
+  /* One variable: only the function itself is reported, without negating the input */
+  if ( num_vars == 1 )
+  {
+    fn( tt, 0u, std::vector<uint8_t>{0} );
+    return;
+  }
+
+  assert( num_vars >= 2 && num_vars <= 6 );
+
+  /* precomputed sequences of swap and flip positions for this number of variables */
+  const auto& swaps = detail::swaps[num_vars - 2u];
+  const auto& flips = detail::flips[num_vars - 2u];
+
+  /* truth table under transformation */
+  auto current = tt;
+
+  /* starts as the identity and is swapped in step with the variables of `current` */
+  std::vector<uint8_t> perm( num_vars );
+  std::iota( perm.begin(), perm.end(), 0u );
+
+  /* negation mask; a flip at position p toggles the bit indexed by perm[p] */
+  uint32_t phase = 0;
+
+  /* applies the swaps one after the other and reports the function after each of them */
+  const auto report_swaps = [&]() {
+    for ( const auto pos : swaps )
+    {
+      swap_adjacent_inplace( current, pos );
+
+      std::swap( perm[pos], perm[pos + 1] );
+
+      fn( current, phase, perm );
+    }
+  };
+
+  /* the input function, followed by the functions obtained through the swaps */
+  fn( current, phase, perm );
+  report_swaps();
+
+  /* each flip step swaps the first two variables and flips one input; the resulting
+     function is reported, followed again by the functions obtained through the swaps */
+  for ( const auto pos : flips )
+  {
+    swap_adjacent_inplace( current, 0 );
+    flip_inplace( current, pos );
+
+    std::swap( perm[0], perm[1] );
+    phase ^= 1 << perm[pos];
+
+    fn( current, phase, perm );
+    report_swaps();
+  }
+}
+
 /*! \brief Obtain truth table from NPN configuration
 
   Given an NPN configuration, which contains a representative
diff --git a/test/algorithms/mapper.cpp b/test/algorithms/mapper.cpp
new file mode 100644
index 000000000..c92dc860b
--- /dev/null
+++ b/test/algorithms/mapper.cpp
@@ -0,0 +1,344 @@
+#include <catch.hpp>
+
+#include <cstdint>
+#include <vector>
+
+#include <mockturtle/algorithms/mapper.hpp>
+#include <mockturtle/algorithms/node_resynthesis/mig_npn.hpp>
+#include <mockturtle/algorithms/node_resynthesis/xmg_npn.hpp>
+#include <mockturtle/algorithms/node_resynthesis/xag_npn.hpp>
+#include <mockturtle/generators/arithmetic.hpp>
+#include <mockturtle/io/genlib_reader.hpp>
+#include <mockturtle/utils/tech_library.hpp>
+#include <mockturtle/networks/aig.hpp>
+#include <mockturtle/networks/mig.hpp>
+#include <mockturtle/networks/xmg.hpp>
+#include <mockturtle/networks/xag.hpp>
+#include <mockturtle/networks/klut.hpp>
+#include <lorina/genlib.hpp>
+
+
+
+using namespace mockturtle;
+
+std::string const test_library =  "GATE   inv1    1 O=!a;     PIN * INV 1 999 0.9 0.3 0.9 0.3\n"
+                                  "GATE   inv2    2 O=!a;     PIN * INV 2 999 1.0 0.1 1.0 0.1\n"
+                                  "GATE   nand2   2 O=!(ab);  PIN * INV 1 999 1.0 0.2 1.0 0.2\n"
+                                  "GATE   xor2    5 O=[ab];   PIN * UNKNOWN 2 999 1.9 0.5 1.9 0.5\n"
+                                  "GATE   mig3    3 O=<abc>;  PIN * INV 1 999 2.0 0.2 2.0 0.2\n"
+                                  "GATE   buf     2 O=a;      PIN * NONINV 1 999 1.0 0.0 1.0 0.0\n"
+                                  "GATE   zero    0 O=0;\n"
+                                  "GATE   one     0 O=1;"; /* genlib text shared by the tech_map tests; per gate: name, area, function; per pin: phase, input/max load, rise block/fanout delay, fall block/fanout delay */
+
+
+TEST_CASE( "Map of MAJ3", "[mapper]" )
+{
+  std::vector<gate> gates;
+  /* maps a single majority-of-three; the expected result is one gate with the area and delay of mig3 */
+  std::istringstream in( test_library );
+  auto result = lorina::read_genlib( in, genlib_reader( gates ) );
+  
+  CHECK( result == lorina::return_code::success );
+
+  tech_library<3> lib( gates ); /* library restricted to gates with at most 3 variables */
+
+  aig_network aig;
+  const auto a = aig.create_pi();
+  const auto b = aig.create_pi();
+  const auto c = aig.create_pi();
+
+  const auto f = aig.create_maj( a, b, c );
+  aig.create_po( f );
+
+  map_params ps;
+  map_stats st;
+  klut_network luts = tech_map( aig, lib, ps, &st );
+
+  CHECK( luts.size() == 6u );
+  CHECK( luts.num_pis() == 3u );
+  CHECK( luts.num_pos() == 1u );
+  CHECK( luts.num_gates() == 1u );
+  CHECK( st.area == 3.0f );  /* equals the area of mig3 in test_library */
+  CHECK( st.delay == 2.0f ); /* equals the block delay of mig3 in test_library */
+}
+
+TEST_CASE( "Map of bad MAJ3 and constant output", "[mapper]" )
+{
+  std::vector<gate> gates;
+  /* maps a redundant nesting of two majorities together with a constant-true output */
+  std::istringstream in( test_library );
+  auto result = lorina::read_genlib( in, genlib_reader( gates ) );
+  
+  CHECK( result == lorina::return_code::success );
+
+  tech_library<3> lib( gates );
+
+  aig_network aig;
+  const auto a = aig.create_pi();
+  const auto b = aig.create_pi();
+  const auto c = aig.create_pi();
+
+  const auto f = aig.create_maj( a, aig.create_maj( a, b, c ), c ); /* functionally the same as maj( a, b, c ) */
+  aig.create_po( f );
+  aig.create_po( aig.get_constant( true ) );
+
+  map_params ps;
+  map_stats st;
+  klut_network luts = tech_map( aig, lib, ps, &st );
+
+  CHECK( luts.size() == 6u );
+  CHECK( luts.num_pis() == 3u );
+  CHECK( luts.num_pos() == 2u );
+  CHECK( luts.num_gates() == 1u ); /* same expected gate count, area and delay as for a plain MAJ3 */
+  CHECK( st.area == 3.0f );
+  CHECK( st.delay == 2.0f );
+}
+
+TEST_CASE( "Map of full adder", "[mapper]" )
+{
+  std::vector<gate> gates;
+  /* maps the sum and carry outputs of a one-bit full adder */
+  std::istringstream in( test_library );
+  auto result = lorina::read_genlib( in, genlib_reader( gates ) );
+  
+  CHECK( result == lorina::return_code::success );
+
+  tech_library<3> lib( gates );
+
+  aig_network aig;
+  const auto a = aig.create_pi();
+  const auto b = aig.create_pi();
+  const auto c = aig.create_pi();
+
+  const auto [sum, carry] = full_adder( aig, a, b, c );
+  aig.create_po( sum );
+  aig.create_po( carry );
+
+  map_params ps;
+  map_stats st;
+  klut_network luts = tech_map( aig, lib, ps, &st );
+
+  const float eps{0.005f}; /* tolerance for the floating-point comparisons below */
+
+  CHECK( luts.size() == 8u );
+  CHECK( luts.num_pis() == 3u );
+  CHECK( luts.num_pos() == 2u );
+  CHECK( luts.num_gates() == 3u );
+  CHECK( st.area > 13.0f - eps ); /* 13 is consistent with two xor2 (5 each) plus one mig3 (3) */
+  CHECK( st.area < 13.0f + eps );
+  CHECK( st.delay > 3.8f - eps ); /* 3.8 is consistent with two xor2 (1.9 each) in series */
+  CHECK( st.delay < 3.8f + eps );
+}
+
+TEST_CASE( "Map with inverters", "[mapper]" )
+{
+  std::vector<gate> gates;
+  /* maps a chain of two ANDs in which the inputs a and c are complemented */
+  std::istringstream in( test_library );
+  auto result = lorina::read_genlib( in, genlib_reader( gates ) );
+  
+  CHECK( result == lorina::return_code::success );
+
+  tech_library<3> lib( gates );
+
+  aig_network aig;
+  const auto a = aig.create_pi();
+  const auto b = aig.create_pi();
+  const auto c = aig.create_pi();
+
+  const auto f1 = aig.create_and( !a, b );
+  const auto f2 = aig.create_and( f1, !c ); /* f2 = !a & b & !c */
+
+  aig.create_po( f2 );
+
+  map_params ps;
+  map_stats st;
+  klut_network luts = tech_map( aig, lib, ps, &st );
+
+  const float eps{0.005f}; /* tolerance for the floating-point comparisons below */
+
+  CHECK( luts.size() == 11u );
+  CHECK( luts.num_pis() == 3u );
+  CHECK( luts.num_pos() == 1u );
+  CHECK( luts.num_gates() == 6u );
+  CHECK( st.area > 8.0f - eps );
+  CHECK( st.area < 8.0f + eps );
+  CHECK( st.delay > 4.7f - eps );
+  CHECK( st.delay < 4.7f + eps );
+}
+
+TEST_CASE( "Map for inverters minimization", "[mapper]" )
+{
+  std::vector<gate> gates;
+  /* maps a majority of three complemented inputs, which equals the complement of the majority */
+  std::istringstream in( test_library );
+  auto result = lorina::read_genlib( in, genlib_reader( gates ) );
+  
+  CHECK( result == lorina::return_code::success );
+
+  tech_library<3> lib( gates );
+
+  aig_network aig;
+  const auto a = aig.create_pi();
+  const auto b = aig.create_pi();
+  const auto c = aig.create_pi();
+
+  const auto f = aig.create_maj( !a, !b, !c );
+  aig.create_po( f );
+
+  map_params ps;
+  map_stats st;
+  klut_network luts = tech_map( aig, lib, ps, &st );
+
+  const float eps{0.005f}; /* tolerance for the floating-point comparisons below */
+
+  CHECK( luts.size() == 7u );
+  CHECK( luts.num_pis() == 3u );
+  CHECK( luts.num_pos() == 1u );
+  CHECK( luts.num_gates() == 2u ); /* two gates are expected rather than one gate plus three input inverters */
+  CHECK( st.area > 4.0f - eps );   /* 4 is consistent with one mig3 (3) plus one inv1 (1) */
+  CHECK( st.area < 4.0f + eps );
+  CHECK( st.delay > 2.9f - eps );  /* 2.9 is consistent with mig3 (2.0) followed by inv1 (0.9) */
+  CHECK( st.delay < 2.9f + eps );
+}
+
+TEST_CASE( "Map of buffer and constant outputs", "[mapper]" )
+{
+  std::vector<gate> gates;
+  /* maps a network whose outputs include a constant, a plain PI and functionally redundant nodes */
+  std::istringstream in( test_library );
+  auto result = lorina::read_genlib( in, genlib_reader( gates ) );
+  
+  CHECK( result == lorina::return_code::success );
+
+  tech_library<3> lib( gates );
+
+  aig_network aig;
+  const auto a = aig.create_pi();
+  const auto b = aig.create_pi();
+  const auto c = aig.create_pi();
+  const auto d = aig.create_pi();
+
+  const auto n5 = aig.create_and( a, d );
+  const auto n6 = aig.create_and( a, !c );
+  const auto n7 = aig.create_and( !c, n5 );
+  const auto n8 = aig.create_and( c, n6 ); /* c & a & !c: functionally constant 0 */
+  const auto n9 = aig.create_and( !n6, n7 );
+  const auto n10 = aig.create_and( n7, n8 );
+  const auto n11 = aig.create_and( a, n10 );
+  const auto n12 = aig.create_and( !d, n11 );
+  const auto n13 = aig.create_and( !d, !n7 );
+  const auto n14 = aig.create_and( !n6, !n7 );
+
+  aig.create_po( aig.get_constant( true ) ); /* constant output */
+  aig.create_po( b );                        /* output driven directly by a PI */
+  aig.create_po( n9 );
+  aig.create_po( n12 );
+  aig.create_po( !n13 );
+  aig.create_po( n14 );
+
+  map_params ps;
+  map_stats st;
+  klut_network luts = tech_map( aig, lib, ps, &st );
+
+  const float eps{0.005f}; /* tolerance for the floating-point comparisons below */
+
+  CHECK( luts.size() == 9u );
+  CHECK( luts.num_pis() == 4u );
+  CHECK( luts.num_pos() == 6u );
+  CHECK( luts.num_gates() == 3u );
+  CHECK( st.area > 5.0f - eps );
+  CHECK( st.area < 5.0f + eps );
+  CHECK( st.delay > 1.9f - eps );
+  CHECK( st.delay < 1.9f + eps );
+}
+
+TEST_CASE( "Exact map of bad MAJ3 and constant output", "[mapper]" )
+{
+  mig_npn_resynthesis resyn{true};
+  /* default exact_library_params: each gate has area 1 and delay 1, inverters cost nothing */
+  exact_library<mig_network, mig_npn_resynthesis>  lib( resyn );
+
+  aig_network aig;
+  const auto a = aig.create_pi();
+  const auto b = aig.create_pi();
+  const auto c = aig.create_pi();
+
+  const auto f = aig.create_maj( a, aig.create_maj( a, b, c ), c ); /* functionally the same as maj( a, b, c ) */
+  aig.create_po( f );
+  aig.create_po( aig.get_constant( true ) );
+
+  map_params ps;
+  map_stats st;
+  mig_network mig = exact_map( aig, lib, ps, &st );
+
+  CHECK( mig.size() == 5u );
+  CHECK( mig.num_pis() == 3u );
+  CHECK( mig.num_pos() == 2u );
+  CHECK( mig.num_gates() == 1u ); /* a single majority gate is expected */
+  CHECK( st.area == 1.0f );
+  CHECK( st.delay == 1.0f );
+}
+
+TEST_CASE( "Exact map of full adder", "[mapper]" )
+{
+  xmg_npn_resynthesis resyn;
+  /* default exact_library_params: each gate has area 1 and delay 1, inverters cost nothing */
+  exact_library<xmg_network, xmg_npn_resynthesis>  lib( resyn );
+
+  aig_network aig;
+  const auto a = aig.create_pi();
+  const auto b = aig.create_pi();
+  const auto c = aig.create_pi();
+
+  const auto [sum, carry] = full_adder( aig, a, b, c );
+  aig.create_po( sum );
+  aig.create_po( carry );
+
+  map_params ps;
+  map_stats st;
+  xmg_network xmg = exact_map( aig, lib, ps, &st );
+
+  CHECK( xmg.size() == 7u );
+  CHECK( xmg.num_pis() == 3u );
+  CHECK( xmg.num_pos() == 2u );
+  CHECK( xmg.num_gates() == 3u );
+  CHECK( st.area == 3.0f );  /* three gates of area 1 */
+  CHECK( st.delay == 2.0f ); /* two gate levels of delay 1 */
+}
+
+TEST_CASE( "Exact map should avoid cycles", "[mapper]" )
+{
+  using resyn_fn = xag_npn_resynthesis<aig_network>;
+  /* maps an AIG onto an AIG library; the two outputs are built on the same three inputs */
+  resyn_fn resyn;
+
+  exact_library<aig_network, resyn_fn>  lib( resyn );
+
+  aig_network aig;
+  const auto x0 = aig.create_pi();
+  const auto x1 = aig.create_pi();
+  const auto x2 = aig.create_pi();
+
+  const auto n0 = aig.create_and( x1, !x2 );
+  const auto n1 = aig.create_and( !x0, n0 );
+  const auto n2 = aig.create_and( x0, !n0 );
+  const auto n3 = aig.create_and( !n1, !n2 );
+  const auto n4 = aig.create_and( x1, x2 );
+  const auto n5 = aig.create_and( x0, !n4 );
+  const auto n6 = aig.create_and( !x0, n4 );
+  const auto n7 = aig.create_and( !n5, !n6 );
+  aig.create_po( n3 );
+  aig.create_po( n7 );
+  
+  map_params ps;
+  map_stats st;
+  aig_network res = exact_map( aig, lib, ps, &st );
+  
+  CHECK( res.size() == 12u ); /* unsigned literals, as in the other tests of this file */
+  CHECK( res.num_pis() == 3u );
+  CHECK( res.num_pos() == 2u );
+  CHECK( res.num_gates() == 8u );
+  CHECK( st.area == 8.0f );
+  CHECK( st.delay == 3.0f );
+}
\ No newline at end of file
diff --git a/test/io/genlib_reader.cpp b/test/io/genlib_reader.cpp
index 135f9a48d..9fe02e23c 100644
--- a/test/io/genlib_reader.cpp
+++ b/test/io/genlib_reader.cpp
@@ -25,6 +25,7 @@ TEST_CASE( "read genlib file", "[genlib_reader]" )
   CHECK( result == lorina::return_code::success );
 
   CHECK( gates.size() == 5u );
+  CHECK( gates[0u].id == 0u );
   CHECK( gates[0u].name == "zero" );
   CHECK( gates[0u].expression == "0" );
   CHECK( gates[0u].function._bits[0] == 0 );
@@ -32,6 +33,7 @@ TEST_CASE( "read genlib file", "[genlib_reader]" )
   CHECK( gates[0u].area == 0.0 );
   CHECK( gates[0u].pins.empty() );
 
+  CHECK( gates[1u].id == 1u );
   CHECK( gates[1u].name == "one" );
   CHECK( gates[1u].expression == "1" );
   CHECK( gates[1u].function._bits[0] == 1 );
@@ -39,6 +41,7 @@ TEST_CASE( "read genlib file", "[genlib_reader]" )
   CHECK( gates[1u].area == 0.0 );
   CHECK( gates[1u].pins.empty() );
 
+  CHECK( gates[2u].id == 2u );
   CHECK( gates[2u].name == "inverter" );
   CHECK( gates[2u].expression == "!a" );
   CHECK( gates[2u].function._bits[0] == 1 );
@@ -54,6 +57,7 @@ TEST_CASE( "read genlib file", "[genlib_reader]" )
   CHECK( gates[2u].pins[0u].rise_block_delay == 1.0 );
   CHECK( gates[2u].pins[0u].rise_fanout_delay == 1.0 );
 
+  CHECK( gates[3u].id == 3u );
   CHECK( gates[3u].name == "buffer" );
   CHECK( gates[3u].expression == "a" );
   CHECK( gates[3u].function._bits[0] == 2 );
@@ -70,6 +74,7 @@ TEST_CASE( "read genlib file", "[genlib_reader]" )
   CHECK( gates[2u].pins[0u].rise_block_delay == 1.0 );
   CHECK( gates[2u].pins[0u].rise_fanout_delay == 1.0 );
 
+  CHECK( gates[4u].id == 4u );
   CHECK( gates[4u].name == "and" );
   CHECK( gates[4u].expression == "(ab)" );
   CHECK( gates[4u].function._bits[0] == 8 );
diff --git a/test/utils/tech_library.cpp b/test/utils/tech_library.cpp
new file mode 100644
index 000000000..2b23f306e
--- /dev/null
+++ b/test/utils/tech_library.cpp
@@ -0,0 +1,162 @@
+#include <catch.hpp>
+
+#include <cstdint>
+#include <vector>
+
+#include <lorina/genlib.hpp>
+#include <mockturtle/io/genlib_reader.hpp>
+#include <mockturtle/utils/tech_library.hpp>
+
+#include <kitty/constructors.hpp>
+#include <kitty/dynamic_truth_table.hpp>
+#include <kitty/static_truth_table.hpp>
+#include <kitty/npn.hpp>
+
+using namespace mockturtle;
+// Minimal genlib library (two inverters and one NAND2) parsed by the "Simple library generation" test.
+std::string const simple_test_library = "GATE   inv1    1 O=!a;     PIN * INV 1 999 0.9 0.3 0.9 0.3\n"
+                                        "GATE   inv2    2 O=!a;     PIN * INV 2 999 1.0 0.1 1.0 0.1\n"
+                                        "GATE   nand2   2 O=!(ab);  PIN * INV 1 999 1.0 0.2 1.0 0.2\n";
+// Genlib library with gates of up to four inputs plus constants, parsed by the "Complete library generation" test.
+std::string const test_library =  "GATE   inv1    3 O=!a;           PIN * INV 3 999 1.1 0.09 1.1 0.09\n"
+                                  "GATE   inv2    2 O=!a;           PIN * INV 2 999 1.0 0.1 1.0 0.1\n"
+                                  "GATE   inv3    1 O=!a;           PIN * INV 1 999 0.9 0.3 0.9 0.3\n"
+                                  "GATE   inv4    4 O=!a;           PIN * INV 4 999 1.2 0.07 1.2 0.07\n"
+                                  "GATE   nand2   2 O=!(ab);        PIN * INV 1 999 1.0 0.2 1.0 0.2\n"
+                                  "GATE   nand3   3 O=!(abc);	      PIN * INV 1 999 1.1 0.3 1.1 0.3\n"
+                                  "GATE   nand4   4 O=!(abcd);      PIN * INV 1 999 1.4 0.4 1.4 0.4\n"
+                                  "GATE   nor2    2 O=!{ab};        PIN * INV 1 999 1.4 0.5 1.4 0.5\n"
+                                  "GATE   nor3    3 O=!{abc};       PIN * INV 1 999 2.4 0.7 2.4 0.7\n"
+                                  "GATE   nor4    4 O=!{abcd};      PIN * INV 1 999 3.8 1.0 3.8 1.0\n"
+                                  "GATE   and2    3 O=(ab);         PIN * NONINV 1 999 1.9 0.3 1.9 0.3\n"
+                                  "GATE   or2     3 O={ab};         PIN * NONINV 1 999 2.4 0.3 2.4 0.3\n"
+                                  "GATE   xor2a   5 O=[ab];         PIN * UNKNOWN 2 999 1.9 0.5 1.9 0.5\n"
+                                  "#GATE  xor2b   5 O=[ab];         PIN * UNKNOWN 2 999 1.9 0.5 1.9 0.5\n"
+                                  "GATE   xnor2a  5 O=![ab];        PIN * UNKNOWN 2 999 2.1 0.5 2.1 0.5\n"
+                                  "#GATE  xnor2b  5 O=![ab];        PIN * UNKNOWN 2 999 2.1 0.5 2.1 0.5\n"
+                                  "GATE   aoi21   3 O=!{(ab)c};     PIN * INV 1 999 1.6 0.4 1.6 0.4\n"
+                                  "GATE   aoi22   4 O=!{(ab)(cd)};  PIN * INV 1 999 2.0 0.4 2.0 0.4\n"
+                                  "GATE   oai21   3 O=!({ab}c);     PIN * INV 1 999 1.6 0.4 1.6 0.4\n"
+                                  "GATE   oai22   4 O=!({ab}{cd});  PIN * INV 1 999 2.0 0.4 2.0 0.4\n"
+                                  "GATE   buf     2 O=a;            PIN * NONINV 1 999 1.0 0.0 1.0 0.0\n"
+                                  "GATE   zero    0 O=0;\n"
+                                  "GATE   one     0 O=1;";
+
+TEST_CASE( "Simple library generation", "[tech_library]" )
+{
+  // Builds a 2-input tech_library from simple_test_library, then checks the
+  // supergates found for the inverter and for NAND2 with polarity 0 to 3.
+  std::vector<gate> gates;
+  std::istringstream in( simple_test_library );
+  auto result = lorina::read_genlib( in, genlib_reader( gates ) );
+  CHECK( result == lorina::return_code::success );
+
+  tech_library<2> lib( gates );
+
+  CHECK( lib.max_gate_size() == 2 );
+  CHECK( lib.get_inverter_info() == std::make_tuple( 1.0f, 0.9f, 0u ) );
+
+  kitty::static_truth_table<2> tt;
+  // REQUIRE guards each lookup: the lines after it dereference and index it.
+  kitty::create_from_hex_string( tt, "5" ); // !a
+  auto const inv = lib.get_supergates( tt );
+  REQUIRE( inv != nullptr );
+  REQUIRE( inv->size() == 2 );
+  CHECK( ( *inv )[0].root->name == "inv1" );
+  CHECK( ( *inv )[0].area == 1.0f );
+  CHECK( ( *inv )[0].worstDelay == 0.9f );
+  CHECK( ( *inv )[0].tdelay[0] == 0.9f );
+  CHECK( ( *inv )[0].polarity == 0u );
+  CHECK( ( *inv )[1].root->name == "inv2" );
+  CHECK( ( *inv )[1].area == 2.0f );
+  CHECK( ( *inv )[1].worstDelay == 1.0f );
+  CHECK( ( *inv )[1].tdelay[0] == 1.0f );
+  CHECK( ( *inv )[1].polarity == 0u );
+
+  kitty::create_from_hex_string( tt, "7" ); // !( a & b )
+  auto const nand_7 = lib.get_supergates( tt );
+  REQUIRE( nand_7 != nullptr );
+  REQUIRE( nand_7->size() == 1 );
+  CHECK( ( *nand_7 )[0].root->name == "nand2" );
+  CHECK( ( *nand_7 )[0].area == 2.0f );
+  CHECK( ( *nand_7 )[0].worstDelay == 1.0f );
+  CHECK( ( *nand_7 )[0].tdelay[0] == 1.0f );
+  CHECK( ( *nand_7 )[0].tdelay[1] == 1.0f );
+  CHECK( ( *nand_7 )[0].polarity == 0u );
+
+  kitty::create_from_hex_string( tt, "b" ); // !( !a & b )
+  auto const nand_b = lib.get_supergates( tt );
+  REQUIRE( nand_b != nullptr );
+  REQUIRE( nand_b->size() == 1 );
+  CHECK( ( *nand_b )[0].root->name == "nand2" );
+  CHECK( ( *nand_b )[0].area == 2.0f );
+  CHECK( ( *nand_b )[0].worstDelay == 1.0f );
+  CHECK( ( *nand_b )[0].tdelay[0] == 1.0f );
+  CHECK( ( *nand_b )[0].tdelay[1] == 1.0f );
+  CHECK( ( *nand_b )[0].polarity == 1u );
+
+  kitty::create_from_hex_string( tt, "d" ); // !( a & !b )
+  auto const nand_d = lib.get_supergates( tt );
+  REQUIRE( nand_d != nullptr );
+  REQUIRE( nand_d->size() == 1 );
+  CHECK( ( *nand_d )[0].root->name == "nand2" );
+  CHECK( ( *nand_d )[0].area == 2.0f );
+  CHECK( ( *nand_d )[0].worstDelay == 1.0f );
+  CHECK( ( *nand_d )[0].tdelay[0] == 1.0f );
+  CHECK( ( *nand_d )[0].tdelay[1] == 1.0f );
+  CHECK( ( *nand_d )[0].polarity == 2u );
+
+  kitty::create_from_hex_string( tt, "e" ); // !( !a & !b )
+  auto const nand_e = lib.get_supergates( tt );
+  REQUIRE( nand_e != nullptr );
+  REQUIRE( nand_e->size() == 1 );
+  CHECK( ( *nand_e )[0].root->name == "nand2" );
+  CHECK( ( *nand_e )[0].area == 2.0f );
+  CHECK( ( *nand_e )[0].worstDelay == 1.0f );
+  CHECK( ( *nand_e )[0].tdelay[0] == 1.0f );
+  CHECK( ( *nand_e )[0].tdelay[1] == 1.0f );
+  CHECK( ( *nand_e )[0].polarity == 3u );
+}
+
+TEST_CASE( "Complete library generation", "[tech_library]" )
+{
+  // Builds a 4-input tech_library from test_library and checks that every
+  // parsed gate appears among the supergates of each function that
+  // kitty::exact_np_enumeration produces from the gate's own function.
+  std::vector<gate> gates;
+  std::istringstream in( test_library );
+  auto result = lorina::read_genlib( in, genlib_reader( gates ) );
+  CHECK( result == lorina::return_code::success );
+
+  tech_library<4> lib( gates );
+
+  CHECK( lib.max_gate_size() == 4 );
+  CHECK( lib.get_inverter_info() == std::make_tuple( 1.0f, 0.9f, 2u ) );
+
+  for ( auto const& gate : gates )
+  {
+    auto const tt = gate.function;
+
+    const auto test_enumeration = [&]( auto const& variant, auto, auto ) {
+      const auto static_tt = kitty::extend_to<4>( variant );
+      auto const supergates = lib.get_supergates( static_tt );
+
+      // REQUIRE, not CHECK: the loop below dereferences the pointer.
+      REQUIRE( supergates != nullptr );
+
+      bool found = false;
+      for ( auto const& supergate : *supergates )
+      {
+        if ( supergate.root->id == gate.id )
+        {
+          found = true;
+          break;
+        }
+      }
+
+      CHECK( found == true );
+    };
+
+    kitty::exact_np_enumeration( tt, test_enumeration );
+  }
+}
\ No newline at end of file