osquery · nachorpaez · Nov 13, 2023 · Nov 13, 2023 · Nov 13, 2023 · Nov 14, 2023
@@ -173,6 +173,7 @@ function(generateOsqueryTablesSystemSystemtable)
 
   elseif(DEFINED PLATFORM_WINDOWS)
     list(APPEND source_files
+      windows/ads.cpp
       windows/appcompat_shims.cpp
       windows/authenticode.cpp
       windows/autoexec.cpp

@@ -0,0 +1,193 @@
+/**
+ * Copyright (c) 2014-present, The osquery authors
+ *
+ * This source code is licensed as defined by the LICENSE file found in the
+ * root directory of this source tree.
+ *
+ * SPDX-License-Identifier: (Apache-2.0 OR GPL-2.0-only)
+ */
+
+#include <boost/algorithm/string/predicate.hpp>
+#include <boost/algorithm/string/trim.hpp>
+#include <boost/filesystem.hpp>
+#include <string>
+#include <windows.h>
+
+#include <osquery/core/tables.h>
+#include <osquery/filesystem/filesystem.h>
+#include <osquery/logger/logger.h>
+#include <osquery/utils/base64.h>
+#include <osquery/utils/chars.h>
+#include <osquery/utils/conversions/split.h>
+#include <osquery/utils/conversions/windows/strings.h>
+#include <osquery/utils/scope_guard.h>
+
+namespace fs = boost::filesystem;
+
+namespace osquery {
+namespace tables {
+
+const std::string kZoneIdentifierKey = "Zone.Identifier";
+
+void setRow(QueryData& results,
+            const std::string& path,
+            const std::string& key,
+            const std::string& value) {
+  Row r;
+  r["path"] = path;
+  r["directory"] = boost::filesystem::path(path).parent_path().string();
+  r["key"] = key;
+  if (isPrintable(value)) {
+    r["value"] = value;
+    r["base64"] = INTEGER(0);
+  } else {
+    r["value"] = base64::encode(value);
+    r["base64"] = INTEGER(1);
+  }
+  results.push_back(r);
+}
+
+void parseZoneIdentifier(QueryData& results,
+                         const std::string& path,
+                         const std::string& streamData) {
+  auto lines = split(streamData, "\n");
+  for (const auto& line : lines) {
+    auto key_len = line.find_first_of("=");
+    if (key_len == std::string::npos) {
+      continue;
+    }
+
+    setRow(results,
+           path,
+           line.substr(0, key_len),
+           line.substr(key_len + 1, line.size()));
+  }
+}
+
+// Process a file and extract all stream names and data.
+void enumerateStreams(QueryData& results, const std::string& path) {
+  WIN32_FIND_STREAM_DATA findStreamData;
+  HANDLE hFind = FindFirstStreamW(stringToWstring(path).c_str(),
+                                  FindStreamInfoStandard,
+                                  &findStreamData,
+                                  0);
+
+  auto fd_guard = scope_guard::create([&] { FindClose(hFind); });
+
+  if (hFind != INVALID_HANDLE_VALUE) {
+    do {
+      std::string stream(wstringToString(findStreamData.cStreamName));
+
+      // Split the stream string into a name and a type, format is
+      // ":streamname:$streamtype"
+      auto streamFullName = split(stream, ":");
+
+      if (streamFullName.size() != 2) {
+        LOG(WARNING) << "Invalid stream name found: '" << stream
+                     << "'. Skipping this entry";
+        continue;
+      }
+      std::string streamName = streamFullName[0];
+
+      // Skip unnamed stream since it represents the file content
+      if (streamName == "") {
+        continue;
+      }
+
+      std::string path_copy = path;
+      // Remove any potential trailing / from path string
+      if (boost::algorithm::ends_with(path_copy, "\\")) {
+        path_copy.pop_back();
+      }
+      std::stringstream streamPath;
+      streamPath << path_copy << ":" << streamName;
+      std::string streamData;
+
+      if (!readFile(streamPath.str(), streamData).ok()) {
+        LOG(INFO) << "Couldn't read stream data: " << streamPath.str();
+        continue;
+      }
+
+      if (streamName == kZoneIdentifierKey) {
+        parseZoneIdentifier(results, path, streamData);
+      } else {
+        // Remove trailing newlines
+        boost::trim_right(streamData);
+        setRow(results, path, streamName, streamData);
+      }
+    } while (FindNextStreamW(hFind, &findStreamData));
+  } else {
+    auto error_code = GetLastError();
+    if (error_code != ERROR_HANDLE_EOF) {
+      LOG(INFO) << "Error occurred while searching for streams in " << path
+                << ". Error code: " << error_code;
+    }
+  }
+}
+
+QueryData genAds(QueryContext& context) {
+  QueryData results;
+  // Resolve file paths for EQUALS and LIKE operations.
+  auto paths = context.constraints["path"].getAll(EQUALS);
+  context.expandConstraints(
+      "path",
+      LIKE,
+      paths,
+      ([&](const std::string& pattern, std::set<std::string>& out) {
+        std::vector<std::string> patterns;
+        auto status =
+            resolveFilePattern(pattern, patterns, GLOB_ALL | GLOB_NO_CANON);
+        if (status.ok()) {
+          for (const auto& resolved : patterns) {
+            out.insert(resolved);
+          }
+        }
+        return status;
+      }));
+
+  for (const auto& path_string : paths) {
+    boost::filesystem::path path = path_string;
+    boost::system::error_code ec;
+    // Folders can have ADS streams too
+    if (!(boost::filesystem::is_regular_file(path, ec) ||
+          boost::filesystem::is_directory(path, ec))) {
+      continue;
+    }
+    enumerateStreams(results, path.string());
+  }
+
+  // Resolve directories for EQUALS and LIKE operations.
+  auto directories = context.constraints["directory"].getAll(EQUALS);
+  context.expandConstraints(
+      "directory",
+      LIKE,
+      directories,
+      ([&](const std::string& pattern, std::set<std::string>& out) {
+        std::vector<std::string> patterns;
+        auto status =
+            resolveFilePattern(pattern, patterns, GLOB_FOLDERS | GLOB_NO_CANON);
+        if (status.ok()) {
+          for (const auto& resolved : patterns) {
+            out.insert(resolved);
+          }
+        }
+        return status;
+      }));
+
+  // Now loop through constraints using the directory column constraint.
+  for (const auto& directory_string : directories) {
+    if (!isReadable(directory_string) || !isDirectory(directory_string)) {
+      continue;
+    }
+
+    std::vector<std::string> files;
+    if (listFilesInDirectory(directory_string, files).ok()) {
+      for (const auto& file : files) {
+        enumerateStreams(results, file);
+      }
+    }
+  }
+  return results;
+}
+} // namespace tables
+} // namespace osquery
@@ -253,6 +253,7 @@ function(generateNativeTables)
     "sleuthkit/device_hash.table:linux,macos,windows"
     "sleuthkit/device_partitions.table:linux,macos,windows"
     "user_groups.table:linux,macos,windows"
+    "windows/ads.table:windows"
     "windows/background_activities_moderator.table:windows"
     "windows/bitlocker_info.table:windows"
     "windows/chassis_info.table:windows"

@@ -0,0 +1,13 @@
+table_name("ads")
+description("Returns the stream names and values for files using NTFS Alternate Data Streams (ADS).")
+schema([
+    Column("path", TEXT, "Absolute file path", required=True, index=True),
+    Column("directory", TEXT, "Directory of file(s)", required=True),
+    Column("key", TEXT, "Name of the value generated from the stream"),
+    Column("value", TEXT, "The parsed information from the attribute"),
+    Column("base64", INTEGER, "1 if the value is base64 encoded else 0"),
+])
+implementation("system/windows/ads@genAds")
+examples([
+  "select * from ads where path = 'C:\\Users\\admin\\Downloads\\test.exe'"
+])
@@ -282,6 +282,7 @@ function(generateTestsIntegrationTablesTestsTest)
 
   elseif(DEFINED PLATFORM_WINDOWS)
     set(platform_source_files
+      ads.cpp
       appcompat_shims.cpp
       arp_cache.cpp
       authenticode.cpp

@@ -0,0 +1,85 @@
+/**
+ * Copyright (c) 2014-present, The osquery authors
+ *
+ * This source code is licensed as defined by the LICENSE file found in the
+ * root directory of this source tree.
+ *
+ * SPDX-License-Identifier: (Apache-2.0 OR GPL-2.0-only)
+ */
+
+// Sanity check integration test for ads
+// Spec file: specs/windows/ads.table
+
+#include <osquery/filesystem/filesystem.h>
+#include <osquery/tests/integration/tables/helper.h>
+#include <string>
+
+namespace osquery {
+namespace table_tests {
+
+const std::string fileName = "test.txt";
+const std::string streamName = "teststream";
+const std::string streamContents = "This is some data in an alternate stream";
+
+class ads : public testing::Test {
+ public:
+  boost::filesystem::path directory;
+
+  void SetUp() override {
+    setUpEnvironment();
+
+    directory =
+        boost::filesystem::temp_directory_path() /
+        boost::filesystem::unique_path("test-integration-file-table.%%%%-%%%%");
+
+    ASSERT_TRUE(boost::filesystem::create_directory(directory));
+
+    auto filepath = directory / boost::filesystem::path(fileName);
+
+    // Create a file
+    std::ofstream file(filepath.native());
+    file << "This is the main file data";
+    file.close();
+
+    // Add data to alternate stream
+    std::string fullStreamPath = filepath.string() + ":" + streamName;
+    std::ofstream streamFile(fullStreamPath);
+    streamFile << streamContents;
+    streamFile.close();
+  }
+
+  virtual void TearDown() {
+    boost::filesystem::remove_all(directory);
+  }
+};
+
+TEST_F(ads, test_sanity) {
+  // std::string path_constraint =
+  //     (directory / boost::filesystem::path("%.txt")).string();
+
+  auto expected_path = directory.string();
+  expected_path += "\\";
+  expected_path += fileName;
+  QueryData data =
+      execute_query("select * from ads where path = \'" + expected_path + "\'");
+
+  auto& row = data.at(0);
+  ASSERT_EQ(row.at("key"), streamName);
+  ASSERT_EQ(row.at("value"), streamContents);
+  ASSERT_EQ(row.at("base64"), true);
+  ASSERT_EQ(row.at("path"), expected_path);
+  ASSERT_EQ(row.at("directory"), directory.string());
+
+  ValidationMap row_map = {
+      {"path", FileOnDisk},
+      {"directory", DirectoryOnDisk},
+      {"key", NormalType},
+      {"value", NormalType},
+      {"base64", IntType},
+  };
+
+  validate_rows(data, row_map);
+}
+
+} // namespace table_tests
+} // namespace osquery