// core/lowering/passes/unpack_log_softmax.cpp

#include "torch/csrc/jit/passes/subgraph_rewrite.h"

#include "core/util/prelude.h"

namespace torch_tensorrt {
namespace core {
namespace lowering {
namespace passes {

// Lowering pass: rewrites each `aten::log_softmax(input, dim, dtype)` node in
// `graph` into `aten::softmax(input, dim, dtype)` followed by `aten::log`.
// The graph is modified in place and logged afterwards through LOG_GRAPH.
void UnpackLogSoftmax(std::shared_ptr<torch::jit::Graph>& graph) {
  // It's easier for TensorRT if softmax and log are separate ops.
  // A reshape might need to be inserted as well, see:
  // https://github.com/onnx/onnx-tensorrt/blob/5dca8737851118f6ab8a33ea1f7bcb7c9f06caf5/builtin_op_importers.cpp#L1593
  // Open question: should such reshapes be added here or in the converter?

  // Variant 1: dtype is a free input of the matched subgraph.
  const std::string fused_pattern = R"IR(
        graph(%input, %dim, %dtype):
            %log_softmax = aten::log_softmax(%input, %dim, %dtype)
            return (%log_softmax))IR";
  const std::string unpacked_pattern = R"IR(
        graph(%input, %dim, %dtype):
            %softmax = aten::softmax(%input, %dim, %dtype)
            %log_softmax = aten::log(%softmax)
            return (%log_softmax))IR";

  // Variant 2: dtype comes from an attribute-less `prim::Constant()` typed
  // `int?` inside the pattern itself (the "none" dtype case).
  const std::string fused_const_dtype_pattern = R"IR(
        graph(%input, %dim):
            %dtype : int? = prim::Constant()
            %log_softmax = aten::log_softmax(%input, %dim, %dtype)
            return (%log_softmax))IR";
  const std::string unpacked_const_dtype_pattern = R"IR(
        graph(%input, %dim):
            %dtype : int? = prim::Constant()
            %softmax = aten::softmax(%input, %dim, %dtype)
            %log_softmax = aten::log(%softmax)
            return (%log_softmax))IR";

  // Each rewrite uses its own SubgraphRewriter holding exactly one
  // pattern/replacement pair and is applied to the graph immediately.
  const auto apply_rewrite = [&graph](const std::string& pattern, const std::string& replacement) {
    torch::jit::SubgraphRewriter rewriter;
    rewriter.RegisterRewritePattern(pattern, replacement);
    rewriter.runOnGraph(graph);
  };

  // Order matters only in that it mirrors the established sequence:
  // free-dtype variant first, constant-dtype variant second.
  apply_rewrite(fused_pattern, unpacked_pattern);
  apply_rewrite(fused_const_dtype_pattern, unpacked_const_dtype_pattern);

  LOG_GRAPH("Post unpack logsoftmax: " << *graph);
}

} // namespace passes
} // namespace lowering
} // namespace core
} // namespace torch_tensorrt