src/models/debugging.cpp (40 changes: 26 additions & 14 deletions)
@@ -83,22 +83,34 @@ void DumpTensor(const Model& model, std::ostream& stream, OrtValue* value, bool
   stream << SGR::Fg_Green << " Location: " << SGR::Reset;

   const auto& memory_info = value->GetTensorMemoryInfo();
-  switch (memory_info.GetDeviceType()) {
-    case OrtMemoryInfoDeviceType_CPU:
-      stream << "CPU\r\n";
+  if (memory_info.GetDeviceType() == OrtMemoryInfoDeviceType_CPU) {
+    stream << "CPU\r\n";
     if (dump_value) {
       DumpValues(stream, type_info->GetElementType(), value->GetTensorRawData(), element_count);
     }
-      break;
-    case OrtMemoryInfoDeviceType_GPU: {
-      stream << "GPU\r\n";
-      auto type = type_info->GetElementType();
-      auto tensor_span = std::span<uint8_t>{const_cast<OrtValue*>(value)->GetTensorMutableData<uint8_t>(), SizeOf(type) * element_count};
-      auto device_span = model.p_device_->WrapMemory<uint8_t>(tensor_span);
-      DumpValues(stream, type, device_span.CopyDeviceToCpu().data(), element_count);
-      break;
-    }
-    default:
-      stream << "Unhandled device type: " << static_cast<int>(memory_info.GetDeviceType()) << "\r\n";
-      break;
+  // Internally there are 5 device types defined in onnxruntime but only 3 are exposed in the public API
+  // https://github.com/microsoft/onnxruntime/blob/9dbfee91ca9c2ba2074d19805bb6dedccedbcfe3/include/onnxruntime/core/framework/ortdevice.h#L15
+  } else if (memory_info.GetDeviceType() < 5) {
+    switch (model.p_device_->GetType()) {
+      case DeviceType::CUDA:
[Inline review thread on the case DeviceType::CUDA: line]

@baijumeswani (Collaborator), Mar 27, 2025:
Shall we try to define a model.p_device_->GetType<std::string>() for each device type? We can avoid the switch statement here then.

    stream << model.p_device_->GetType<std::string>() << "\r\n";
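A minimal sketch of what this suggestion could look like, assuming an illustrative DeviceInterface that owns a DeviceType enum; the class shape, member names, and enum values here are hypothetical stand-ins, not the actual onnxruntime-genai API:

    #include <string>

    // Illustrative stand-ins for the real onnxruntime-genai types.
    enum class DeviceType { CPU, CUDA, DML, QNN };

    struct DeviceInterface {
      DeviceType type_{DeviceType::CPU};

      // Primary template mirrors the existing GetType(): returns the raw enum.
      template <typename T>
      T GetType() const { return type_; }
    };

    // Hypothetical specialization mapping each device type to a printable
    // name, so call sites can write GetType<std::string>() instead of a switch.
    template <>
    inline std::string DeviceInterface::GetType<std::string>() const {
      switch (type_) {
        case DeviceType::CPU:  return "CPU";
        case DeviceType::CUDA: return "CUDA";
        case DeviceType::DML:  return "DML";
        case DeviceType::QNN:  return "QNN";
      }
      return "Unknown";
    }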

Reply (Contributor):
I think we can fairly safely say that if the tensor is not on CPU, it's on the model.p_device_.

Reply (Contributor):
Oh, I see. We shouldn't use a switch here; use this:

    std::string to_string(DeviceType device_type);
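A sketch of that shape, reusing the illustrative DeviceType enum from the sketch above; the switch moves into one shared helper, and the dump site shrinks to a single stream insertion:

    #include <string>

    enum class DeviceType { CPU, CUDA, DML, QNN };  // illustrative, as above

    // Hypothetical free function: one shared place that knows how to name a
    // device, instead of an inline switch at every dump site.
    std::string to_string(DeviceType device_type) {
      switch (device_type) {
        case DeviceType::CPU:  return "CPU";
        case DeviceType::CUDA: return "CUDA";
        case DeviceType::DML:  return "DML";
        case DeviceType::QNN:  return "QNN";
      }
      return "Unknown";
    }

    // The dump site would then collapse to:
    //   stream << to_string(model.p_device_->GetType()) << "\r\n";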

stream << "CUDA\r\n";
break;
case DeviceType::DML:
stream << "DML\r\n";
break;
case DeviceType::QNN:
stream << "QNN\r\n";
break;
default:
stream << "Unknown\r\n";
break;
}
auto type = type_info->GetElementType();
auto tensor_span = std::span<uint8_t>{const_cast<OrtValue*>(value)->GetTensorMutableData<uint8_t>(), SizeOf(type) * element_count};
auto device_span = model.p_device_->WrapMemory<uint8_t>(tensor_span);
DumpValues(stream, type, device_span.CopyDeviceToCpu().data(), element_count);
} else {
stream << "Unhandled device type: " << static_cast<int>(memory_info.GetDeviceType()) << "\r\n";
}
}
