tensorflow · tensorflow-copybara · Jul 7, 2020 · Jun 18, 2020 · Jul 6, 2020
diff --git a/tensorflow/compiler/xla/tools/replay_computation.cc b/tensorflow/compiler/xla/tools/replay_computation.cc
@@ -233,8 +233,14 @@ StatusOr<Literal> ReplayComputation(const HloSnapshot& module,
   if (opts.use_fake_data) {
     // Run fake computations with debug options ignoring XLA_FLAGS.  Users very
     // likely want XLA_FLAGS only to apply to the "real" computation being run,
-    // not to the fake computations we use for generating arguments.
+    // not to the fake computations we use for generating arguments. There is
+    // an exception. ptxas can be called during the generation of fake
+    // data. As it is cached in the process memory, the flag affecting this call
+    // should not be ignored.
+    auto debug_opts_flags = GetDebugOptionsFromFlags();
     auto debug_opts = DefaultDebugOptionsIgnoringFlags();
+    debug_opts.set_xla_gpu_asm_extra_flags(debug_opts_flags.xla_gpu_asm_extra_flags());
+
     global_data_arguments =
         MakeFakeArgumentsOrDie(computation, client, &debug_opts);
     for (const auto& data : global_data_arguments) {