Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 3 additions & 0 deletions src/Storages/ObjectStorage/DataLakes/IDataLakeMetadata.h
Original file line number Diff line number Diff line change
Expand Up @@ -166,6 +166,9 @@ class IDataLakeMetadata : boost::noncopyable
virtual void checkAlterIsPossible(const AlterCommands & /*commands*/) { throwNotImplemented("alter"); }
virtual void alter(const AlterCommands & /*params*/, ContextPtr /*context*/) { throwNotImplemented("alter"); }

virtual std::optional<String> partitionKey(ContextPtr) const { return {}; }
virtual std::optional<String> sortingKey(ContextPtr) const { return {}; }

protected:
virtual ObjectIterator createKeysIterator(
Strings && data_files_,
Expand Down
204 changes: 203 additions & 1 deletion src/Storages/ObjectStorage/DataLakes/Iceberg/IcebergMetadata.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -258,6 +258,192 @@ bool IcebergMetadata::update(const ContextPtr & local_context)
return previous_snapshot_schema_id != relevant_snapshot_schema_id;
}

namespace
{

using IdToName = std::unordered_map<Int32, String>;

IdToName buildIdToNameMap(const Poco::JSON::Object::Ptr & metadata_obj)
{
IdToName map;
if (!metadata_obj || !metadata_obj->has("current-schema-id") || !metadata_obj->has("schemas"))
return map;

const auto current_schema_id = metadata_obj->getValue<Int32>("current-schema-id");
auto schemas = metadata_obj->getArray("schemas");
if (!schemas)
return map;

for (size_t i = 0; i < schemas->size(); ++i)
{
auto schema = schemas->getObject(i);

if (!schema || !schema->has("schema-id") || (schema->getValue<Int32>("schema-id") != current_schema_id))
continue;

if (auto fields = schema->getArray("fields"))
{
for (size_t j = 0; j < fields->size(); ++j)
{
auto f = fields->getObject(j);
if (!f || !f->has("id") || !f->has("name"))
continue;
map.emplace(f->getValue<Int32>("id"), f->getValue<String>("name"));
}
}
break;
}
return map;
}

String formatTransform(
const String & transform,
const Poco::JSON::Object::Ptr & field_obj,
const IdToName & id_to_name)
{
Int32 source_id = (field_obj && field_obj->has("source-id"))
? field_obj->getValue<Int32>("source-id")
: -1;

const auto it = id_to_name.find(source_id);
const String col = (it != id_to_name.end()) ? it->second : ("col_" + toString(source_id));

String base = transform;
String param;
if (const auto lpos = transform.find('['); lpos != String::npos && transform.back() == ']')
{
base = transform.substr(0, lpos);
param = transform.substr(lpos + 1, transform.size() - lpos - 2); // strip [ and ]
}

String result;
if (base == "identity")
result = col;
else if (base == "year" || base == "month" || base == "day" || base == "hour")
result = base + "(" + col + ")";
else if (base != "void")
{
if (!param.empty())
result = base + "(" + param + ", " + col + ")";
else
result = base + "(" + col + ")";
}
return result;
}

Poco::JSON::Array::Ptr findActivePartitionFields(const Poco::JSON::Object::Ptr & metadata_obj)
{
if (!metadata_obj)
return nullptr;

if (metadata_obj->has("partition-spec"))
return metadata_obj->getArray("partition-spec");

// If for some reason there is no partition-spec, try partition-specs + default-
if (metadata_obj->has("partition-specs") && metadata_obj->has("default-spec-id"))
{
const auto default_spec_id = metadata_obj->getValue<Int32>("default-spec-id");
if (auto specs = metadata_obj->getArray("partition-specs"))
{
for (size_t i = 0; i < specs->size(); ++i)
{
auto spec = specs->getObject(i);
if (!spec || !spec->has("spec-id"))
continue;
if (spec->getValue<Int32>("spec-id") == default_spec_id)
return spec->has("fields") ? spec->getArray("fields") : nullptr;
}
}
}

return nullptr;
}

Poco::JSON::Array::Ptr findActiveSortFields(const Poco::JSON::Object::Ptr & metadata_obj)
{
if (!metadata_obj || !metadata_obj->has("default-sort-order-id") || !metadata_obj->has("sort-orders"))
return nullptr;

const auto default_sort_order_id = metadata_obj->getValue<Int32>("default-sort-order-id");
auto orders = metadata_obj->getArray("sort-orders");
if (!orders)
return nullptr;

for (size_t i = 0; i < orders->size(); ++i)
{
auto order = orders->getObject(i);
if (!order || !order->has("order-id"))
continue;
if (order->getValue<Int32>("order-id") == default_sort_order_id)
return order->has("fields") ? order->getArray("fields") : nullptr;
}
return nullptr;
}

String composeList(
const Poco::JSON::Array::Ptr & fields,
const IdToName & id_to_name,
bool lookup_sort_modifiers)
{
if (!fields || fields->size() == 0)
return {};

Strings parts;
parts.reserve(fields->size());

for (size_t i = 0; i < fields->size(); ++i)
{
auto field = fields->getObject(i);
if (!field)
continue;

const String transform = field->has("transform") ? field->getValue<String>("transform") : "identity";
String expr = formatTransform(transform, field, id_to_name);
if (expr.empty())
continue;

if (lookup_sort_modifiers)
{
if (field->has("direction"))
{
auto d = field->getValue<String>("direction");
expr += (Poco::icompare(d, "desc") == 0) ? " DESC" : " ASC";
}
}

parts.push_back(std::move(expr));
}

if (parts.empty())
return {};

String res;
for (size_t i = 0; i < parts.size(); ++i)
{
if (i) res += ", ";
res += parts[i];
}
return res;
}

std::pair<std::optional<String>, std::optional<String>> extractIcebergKeys(const Poco::JSON::Object::Ptr & metadata_obj)
{
std::optional<String> partition_key;
std::optional<String> sort_key;

if (metadata_obj)
{
auto id_to_name = buildIdToNameMap(metadata_obj);

partition_key = composeList(findActivePartitionFields(metadata_obj), id_to_name, /*lookup_sort_modifiers=*/ false);
sort_key = composeList(findActiveSortFields(metadata_obj), id_to_name, /*lookup_sort_modifiers=*/ true);
}

return {partition_key, sort_key};
}

}

void IcebergMetadata::updateSnapshot(ContextPtr local_context, Poco::JSON::Object::Ptr metadata_object)
{
auto configuration_ptr = configuration.lock();
Expand Down Expand Up @@ -309,6 +495,7 @@ void IcebergMetadata::updateSnapshot(ContextPtr local_context, Poco::JSON::Objec
}
}

auto [partition_key, sorting_key] = extractIcebergKeys(metadata_object);
relevant_snapshot = std::make_shared<IcebergDataSnapshot>(
getManifestList(
object_storage,
Expand All @@ -324,7 +511,9 @@ void IcebergMetadata::updateSnapshot(ContextPtr local_context, Poco::JSON::Objec
relevant_snapshot_id,
total_rows,
total_bytes,
total_position_deletes);
total_position_deletes,
partition_key,
sorting_key);

if (!snapshot->has(f_schema_id))
throw Exception(
Expand Down Expand Up @@ -777,6 +966,19 @@ std::optional<size_t> IcebergMetadata::totalBytes(ContextPtr local_context) cons
return result;
}

std::optional<String> IcebergMetadata::partitionKey(ContextPtr) const
{
SharedLockGuard lock(mutex);
return relevant_snapshot->partition_key;
}

std::optional<String> IcebergMetadata::sortingKey(ContextPtr) const
{
SharedLockGuard lock(mutex);
return relevant_snapshot->sorting_key;
}


ObjectIterator IcebergMetadata::iterate(
const ActionsDAG * filter_dag,
FileProgressCallback callback,
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -121,6 +121,9 @@ class IcebergMetadata : public IDataLakeMetadata
void checkAlterIsPossible(const AlterCommands & commands) override;
void alter(const AlterCommands & params, ContextPtr context) override;

std::optional<String> partitionKey(ContextPtr) const override;
std::optional<String> sortingKey(ContextPtr) const override;

protected:
ObjectIterator
iterate(const ActionsDAG * filter_dag, FileProgressCallback callback, size_t list_batch_size, ContextPtr local_context) const override;
Expand Down
2 changes: 2 additions & 0 deletions src/Storages/ObjectStorage/DataLakes/Iceberg/Snapshot.h
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,8 @@ struct IcebergDataSnapshot
std::optional<size_t> total_rows;
std::optional<size_t> total_bytes;
std::optional<size_t> total_position_delete_rows;
std::optional<String> partition_key;
std::optional<String> sorting_key;

std::optional<size_t> getTotalRows() const
{
Expand Down
54 changes: 46 additions & 8 deletions src/Storages/System/StorageSystemTables.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -22,6 +22,8 @@
#include <QueryPipeline/Pipe.h>
#include <QueryPipeline/QueryPipelineBuilder.h>
#include <Storages/MergeTree/MergeTreeData.h>
#include <Storages/ObjectStorage/StorageObjectStorageCluster.h>
#include <Storages/ObjectStorage/DataLakes/IDataLakeMetadata.h>
#include <Storages/SelectQueryInfo.h>
#include <Storages/StorageView.h>
#include <Storages/System/getQueriedColumnsMaskAndHeader.h>
Expand Down Expand Up @@ -604,18 +606,54 @@ class TablesBlockSource : public ISource
ASTPtr expression_ptr;
if (columns_mask[src_index++])
{
if (metadata_snapshot && (expression_ptr = metadata_snapshot->getPartitionKeyAST()))
res_columns[res_index++]->insert(format({context, *expression_ptr}));
else
res_columns[res_index++]->insertDefault();
bool inserted = false;
// Extract from specific DataLake metadata if suitable
if (auto * obj = dynamic_cast<StorageObjectStorageCluster *>(table.get()))
{
if (auto * dl_meta = obj->getExternalMetadata(context))
{
if (auto p = dl_meta->partitionKey(context); p.has_value())
{
res_columns[res_index++]->insert(*p);
inserted = true;
}
}

}

if (!inserted)
{
if (metadata_snapshot && (expression_ptr = metadata_snapshot->getPartitionKeyAST()))
res_columns[res_index++]->insert(format({context, *expression_ptr}));
else
res_columns[res_index++]->insertDefault();
}
}

if (columns_mask[src_index++])
{
if (metadata_snapshot && (expression_ptr = metadata_snapshot->getSortingKey().expression_list_ast))
res_columns[res_index++]->insert(format({context, *expression_ptr}));
else
res_columns[res_index++]->insertDefault();
bool inserted = false;

// Extract from specific DataLake metadata if suitable
if (auto * obj = dynamic_cast<StorageObjectStorageCluster *>(table.get()))
{
if (auto * dl_meta = obj->getExternalMetadata(context))
{
if (auto p = dl_meta->sortingKey(context); p.has_value())
{
res_columns[res_index++]->insert(*p);
inserted = true;
}
}
}

if (!inserted)
{
if (metadata_snapshot && (expression_ptr = metadata_snapshot->getSortingKey().expression_list_ast))
res_columns[res_index++]->insert(format({context, *expression_ptr}));
else
res_columns[res_index++]->insertDefault();
}
}

if (columns_mask[src_index++])
Expand Down
Loading
Loading