From 05ac5bc8db5f0a1b374bebf7776bdf16a75ad740 Mon Sep 17 00:00:00 2001 From: Vasily Nemkov Date: Thu, 9 Oct 2025 21:15:48 +0200 Subject: [PATCH 01/12] 26.1 Antalya port - Alternative syntax for cluster functions --- .../FunctionSecretArgumentsFinderTreeNode.h | 10 +- src/Core/Settings.cpp | 9 + src/Core/SettingsChangesHistory.cpp | 14 + src/Databases/DataLake/DatabaseDataLake.cpp | 42 +- src/Databases/DataLake/DatabaseDataLake.h | 2 +- src/Databases/DataLake/GlueCatalog.cpp | 2 +- src/Disks/DiskType.cpp | 63 +- src/Disks/DiskType.h | 5 +- src/Interpreters/Cluster.cpp | 37 +- src/Interpreters/Cluster.h | 7 +- src/Interpreters/InterpreterCreateQuery.cpp | 3 +- src/Parsers/FunctionSecretArgumentsFinder.h | 104 ++- .../FunctionSecretArgumentsFinderAST.h | 9 +- src/Server/TCPHandler.cpp | 2 +- src/Storages/HivePartitioningUtils.cpp | 6 +- src/Storages/IStorage.h | 3 + src/Storages/IStorageCluster.cpp | 38 +- src/Storages/IStorageCluster.h | 38 +- .../ObjectStorage/Azure/Configuration.cpp | 41 +- .../ObjectStorage/Azure/Configuration.h | 15 +- .../DataLakes/DataLakeConfiguration.h | 400 ++++++++++- .../DataLakes/DataLakeStorageSettings.h | 3 + .../DeltaLakeMetadataDeltaKernel.cpp | 10 +- .../ObjectStorage/DataLakes/HudiMetadata.cpp | 2 +- .../DataLakes/Iceberg/IcebergMetadata.cpp | 2 +- .../DataLakes/Iceberg/IcebergWrites.cpp | 2 +- .../ObjectStorage/HDFS/Configuration.cpp | 8 + .../ObjectStorage/HDFS/Configuration.h | 2 + .../ObjectStorage/ReadBufferIterator.cpp | 10 +- .../ObjectStorage/S3/Configuration.cpp | 27 + src/Storages/ObjectStorage/S3/Configuration.h | 2 + .../ObjectStorage/StorageObjectStorage.cpp | 59 +- .../ObjectStorage/StorageObjectStorage.h | 2 +- .../StorageObjectStorageCluster.cpp | 619 +++++++++++++++++- .../StorageObjectStorageCluster.h | 126 +++- .../StorageObjectStorageConfiguration.cpp | 41 +- .../StorageObjectStorageConfiguration.h | 59 +- .../StorageObjectStorageSettings.h | 10 + .../StorageObjectStorageSink.cpp | 6 +- .../StorageObjectStorageSource.cpp | 14 +- src/Storages/ObjectStorage/Utils.cpp | 15 +- src/Storages/ObjectStorage/Utils.h | 3 +- .../registerStorageObjectStorage.cpp | 33 +- .../StorageObjectStorageQueue.cpp | 8 +- .../StorageObjectStorageQueue.h | 2 +- .../registerQueueStorage.cpp | 2 +- .../System/StorageSystemIcebergHistory.cpp | 6 +- .../extractTableFunctionFromSelectQuery.cpp | 11 +- .../extractTableFunctionFromSelectQuery.h | 3 +- src/TableFunctions/ITableFunction.h | 2 +- src/TableFunctions/ITableFunctionCluster.h | 7 +- .../TableFunctionObjectStorage.cpp | 177 +---- .../TableFunctionObjectStorage.h | 30 +- .../TableFunctionObjectStorageCluster.cpp | 41 +- .../TableFunctionObjectStorageCluster.h | 19 +- ...leFunctionObjectStorageClusterFallback.cpp | 449 +++++++++++++ ...ableFunctionObjectStorageClusterFallback.h | 49 ++ src/TableFunctions/registerTableFunctions.cpp | 1 + src/TableFunctions/registerTableFunctions.h | 1 + tests/integration/helpers/iceberg_utils.py | 90 ++- .../test_mask_sensitive_info/test.py | 110 +++- tests/integration/test_s3_cluster/test.py | 325 ++++++++- .../configs/config.d/named_collections.xml | 14 + .../configs/config.d/named_collections.xml | 14 + .../test_cluster_table_function.py | 178 ++++- .../test_types.py | 46 ++ 66 files changed, 2968 insertions(+), 522 deletions(-) create mode 100644 src/TableFunctions/TableFunctionObjectStorageClusterFallback.cpp create mode 100644 src/TableFunctions/TableFunctionObjectStorageClusterFallback.h diff --git a/src/Analyzer/FunctionSecretArgumentsFinderTreeNode.h 
b/src/Analyzer/FunctionSecretArgumentsFinderTreeNode.h index 8bcb6e147420..e4f63192c95b 100644 --- a/src/Analyzer/FunctionSecretArgumentsFinderTreeNode.h +++ b/src/Analyzer/FunctionSecretArgumentsFinderTreeNode.h @@ -71,8 +71,14 @@ class FunctionTreeNodeImpl : public AbstractFunction { public: explicit ArgumentsTreeNode(const QueryTreeNodes * arguments_) : arguments(arguments_) {} - size_t size() const override { return arguments ? arguments->size() : 0; } - std::unique_ptr at(size_t n) const override { return std::make_unique(arguments->at(n).get()); } + size_t size() const override + { /// size without skipped indexes + return arguments ? arguments->size() - skippedSize() : 0; + } + std::unique_ptr at(size_t n) const override + { /// n is a relative index; some indexes can be skipped + return std::make_unique(arguments->at(getRealIndex(n)).get()); + } private: const QueryTreeNodes * arguments = nullptr; }; diff --git a/src/Core/Settings.cpp b/src/Core/Settings.cpp index e72653747d54..6ca5df143995 100644 --- a/src/Core/Settings.cpp +++ b/src/Core/Settings.cpp @@ -7441,6 +7441,15 @@ Enable PRQL - an alternative to SQL. )", EXPERIMENTAL) \ DECLARE(Bool, enable_adaptive_memory_spill_scheduler, false, R"( Trigger processor to spill data into external storage adpatively. grace join is supported at present. +)", EXPERIMENTAL) \ + DECLARE(String, object_storage_cluster, "", R"( +Cluster used to make distributed requests to object storages with the alternative syntax. +)", EXPERIMENTAL) \ + DECLARE(UInt64, object_storage_max_nodes, 0, R"( +Limit on the number of hosts used for requests in object storage cluster table functions - azureBlobStorageCluster, s3Cluster, hdfsCluster, etc. +Possible values: +- Positive integer. +- 0 — All hosts in the cluster. )", EXPERIMENTAL) \ DECLARE(Bool, allow_experimental_delta_kernel_rs, true, R"( Allow experimental delta-kernel-rs implementation. diff --git a/src/Core/SettingsChangesHistory.cpp b/src/Core/SettingsChangesHistory.cpp index e8686e2a43ea..949e63ed8a49 100644 --- a/src/Core/SettingsChangesHistory.cpp +++ b/src/Core/SettingsChangesHistory.cpp @@ -39,6 +39,11 @@ const VersionToSettingsChangesMap & getSettingsChangesHistory() /// controls new feature and it's 'true' by default, use 'false' as previous_value). /// It's used to implement `compatibility` setting (see https://github.com/ClickHouse/ClickHouse/issues/35972) /// Note: please check if the key already exists to prevent duplicate entries.
+ addSettingsChanges(settings_changes_history, "26.1.1.2000", + { + {"object_storage_cluster", "", "", "Antalya: New setting"}, + {"object_storage_max_nodes", 0, 0, "Antalya: New setting"}, + }); addSettingsChanges(settings_changes_history, "26.1", { {"parallel_replicas_filter_pushdown", false, false, "New setting"}, @@ -312,6 +317,15 @@ const VersionToSettingsChangesMap & getSettingsChangesHistory() {"allow_experimental_insert_into_iceberg", false, false, "New setting."}, /// RELEASE CLOSED }); + addSettingsChanges(settings_changes_history, "25.6.5.2000", + { + {"allow_experimental_database_iceberg", false, true, "Turned ON by default for Antalya"}, + {"allow_experimental_database_unity_catalog", false, true, "Turned ON by default for Antalya"}, + {"allow_experimental_database_glue_catalog", false, true, "Turned ON by default for Antalya"}, + {"output_format_parquet_enum_as_byte_array", true, true, "Enable writing Enum as byte array in Parquet by default"}, + {"object_storage_cluster", "", "", "New setting"}, + {"object_storage_max_nodes", 0, 0, "New setting"}, + }); addSettingsChanges(settings_changes_history, "25.6", { /// RELEASE CLOSED diff --git a/src/Databases/DataLake/DatabaseDataLake.cpp b/src/Databases/DataLake/DatabaseDataLake.cpp index d617751a3eb6..e96b5ff7d5ab 100644 --- a/src/Databases/DataLake/DatabaseDataLake.cpp +++ b/src/Databases/DataLake/DatabaseDataLake.cpp @@ -55,6 +55,7 @@ namespace DatabaseDataLakeSetting extern const DatabaseDataLakeSettingsString oauth_server_uri; extern const DatabaseDataLakeSettingsBool oauth_server_use_request_body; extern const DatabaseDataLakeSettingsBool vended_credentials; + extern const DatabaseDataLakeSettingsString object_storage_cluster; extern const DatabaseDataLakeSettingsString aws_access_key_id; extern const DatabaseDataLakeSettingsString aws_secret_access_key; extern const DatabaseDataLakeSettingsString region; @@ -241,7 +242,7 @@ std::shared_ptr DatabaseDataLake::getCatalog() const return catalog_impl; } -std::shared_ptr DatabaseDataLake::getConfiguration( +StorageObjectStorageConfigurationPtr DatabaseDataLake::getConfiguration( DatabaseDataLakeStorageType type, DataLakeStorageSettingsPtr storage_settings) const { @@ -567,7 +568,7 @@ StoragePtr DatabaseDataLake::tryGetTableImpl(const String & name, ContextPtr con /// with_table_structure = false: because there will be /// no table structure in table definition AST. - StorageObjectStorageConfiguration::initialize(*configuration, args, context_copy, /* with_table_structure */false); + configuration->initialize(args, context_copy, /* with_table_structure */false); const auto & query_settings = context_->getSettingsRef(); @@ -579,49 +580,34 @@ StoragePtr DatabaseDataLake::tryGetTableImpl(const String & name, ContextPtr con const auto is_secondary_query = context_->getClientInfo().query_kind == ClientInfo::QueryKind::SECONDARY_QUERY; - if (can_use_parallel_replicas && !is_secondary_query) - { - auto storage_cluster = std::make_shared( - parallel_replicas_cluster_name, - configuration, - configuration->createObjectStorage(context_copy, /* is_readonly */ false), - StorageID(getDatabaseName(), name), - columns, - ConstraintsDescription{}, - nullptr, - context_, - /// Use is_table_function = true, - /// because this table is actually stateless like a table function. 
- /* is_table_function */true); - - storage_cluster->startup(); - return storage_cluster; - } + auto cluster_name = settings[DatabaseDataLakeSetting::object_storage_cluster].value; - bool can_use_distributed_iterator = - context_->getClientInfo().collaborate_with_initiator && - can_use_parallel_replicas; + if (can_use_parallel_replicas && !is_secondary_query) + cluster_name = parallel_replicas_cluster_name; - return std::make_shared( + auto storage_cluster = std::make_shared( + cluster_name, configuration, configuration->createObjectStorage(context_copy, /* is_readonly */ false), - context_copy, StorageID(getDatabaseName(), name), /* columns */columns, /* constraints */ConstraintsDescription{}, + /* partition_by */nullptr, + /* order_by */nullptr, + context_copy, /* comment */"", getFormatSettings(context_copy), LoadingStrictnessLevel::CREATE, getCatalog(), /* if_not_exists*/true, /* is_datalake_query*/true, - /* distributed_processing */can_use_distributed_iterator, - /* partition_by */nullptr, - /* order_by */nullptr, /// Use is_table_function = true, /// because this table is actually stateless like a table function. /* is_table_function */true, /* lazy_init */true); + + storage_cluster->startup(); + return storage_cluster; } void DatabaseDataLake::dropTable( /// NOLINT diff --git a/src/Databases/DataLake/DatabaseDataLake.h b/src/Databases/DataLake/DatabaseDataLake.h index bed47c5ccae6..736b951b0b21 100644 --- a/src/Databases/DataLake/DatabaseDataLake.h +++ b/src/Databases/DataLake/DatabaseDataLake.h @@ -84,7 +84,7 @@ class DatabaseDataLake final : public IDatabase, WithContext void validateSettings(); std::shared_ptr getCatalog() const; - std::shared_ptr getConfiguration( + StorageObjectStorageConfigurationPtr getConfiguration( DatabaseDataLakeStorageType type, DataLakeStorageSettingsPtr storage_settings) const; diff --git a/src/Databases/DataLake/GlueCatalog.cpp b/src/Databases/DataLake/GlueCatalog.cpp index 0bb26afaafa1..28688afa4c34 100644 --- a/src/Databases/DataLake/GlueCatalog.cpp +++ b/src/Databases/DataLake/GlueCatalog.cpp @@ -513,7 +513,7 @@ GlueCatalog::ObjectStorageWithPath GlueCatalog::createObjectStorageForEarlyTable auto storage_settings = std::make_shared(); storage_settings->loadFromSettingsChanges(settings.allChanged()); auto configuration = std::make_shared(storage_settings); - DB::StorageObjectStorageConfiguration::initialize(*configuration, args, getContext(), false); + configuration->initialize(args, getContext(), false); auto object_storage = configuration->createObjectStorage(getContext(), true); diff --git a/src/Disks/DiskType.cpp b/src/Disks/DiskType.cpp index bf4506b4cbf6..ddc42cd07dc3 100644 --- a/src/Disks/DiskType.cpp +++ b/src/Disks/DiskType.cpp @@ -10,7 +10,7 @@ namespace ErrorCodes extern const int LOGICAL_ERROR; } -MetadataStorageType metadataTypeFromString(const String & type) +MetadataStorageType metadataTypeFromString(const std::string & type) { auto check_type = Poco::toLower(type); if (check_type == "local") @@ -58,25 +58,7 @@ String DataSourceDescription::name() const case DataSourceType::RAM: return "memory"; case DataSourceType::ObjectStorage: - { - switch (object_storage_type) - { - case ObjectStorageType::S3: - return "s3"; - case ObjectStorageType::HDFS: - return "hdfs"; - case ObjectStorageType::Azure: - return "azure_blob_storage"; - case ObjectStorageType::Local: - return "local_blob_storage"; - case ObjectStorageType::Web: - return "web"; - case ObjectStorageType::None: - return "none"; - case ObjectStorageType::Max: - throw 
Exception(ErrorCodes::LOGICAL_ERROR, "Unexpected object storage type: Max"); - } - } + return DB::toString(object_storage_type); } } @@ -86,4 +68,45 @@ String DataSourceDescription::toString() const name(), description, is_encrypted, is_cached, zookeeper_name); } +ObjectStorageType objectStorageTypeFromString(const std::string & type) +{ + auto check_type = Poco::toLower(type); + if (check_type == "s3") + return ObjectStorageType::S3; + if (check_type == "hdfs") + return ObjectStorageType::HDFS; + if (check_type == "azure_blob_storage" || check_type == "azure") + return ObjectStorageType::Azure; + if (check_type == "local_blob_storage" || check_type == "local") + return ObjectStorageType::Local; + if (check_type == "web") + return ObjectStorageType::Web; + if (check_type == "none") + return ObjectStorageType::None; + + throw Exception(ErrorCodes::UNKNOWN_ELEMENT_IN_CONFIG, + "Unknown object storage type: {}", type); +} + +std::string toString(ObjectStorageType type) +{ + switch (type) + { + case ObjectStorageType::S3: + return "s3"; + case ObjectStorageType::HDFS: + return "hdfs"; + case ObjectStorageType::Azure: + return "azure_blob_storage"; + case ObjectStorageType::Local: + return "local_blob_storage"; + case ObjectStorageType::Web: + return "web"; + case ObjectStorageType::None: + return "none"; + case ObjectStorageType::Max: + throw Exception(ErrorCodes::LOGICAL_ERROR, "Unexpected object storage type: Max"); + } +} + } diff --git a/src/Disks/DiskType.h b/src/Disks/DiskType.h index 9018cd605481..835c1341775b 100644 --- a/src/Disks/DiskType.h +++ b/src/Disks/DiskType.h @@ -36,7 +36,10 @@ enum class MetadataStorageType : uint8_t Memory, }; -MetadataStorageType metadataTypeFromString(const String & type); +MetadataStorageType metadataTypeFromString(const std::string & type); + +ObjectStorageType objectStorageTypeFromString(const std::string & type); +std::string toString(ObjectStorageType type); struct DataSourceDescription { diff --git a/src/Interpreters/Cluster.cpp b/src/Interpreters/Cluster.cpp index fb6249c5e3e4..a3e7014469de 100644 --- a/src/Interpreters/Cluster.cpp +++ b/src/Interpreters/Cluster.cpp @@ -741,9 +741,9 @@ void Cluster::initMisc() } } -std::unique_ptr Cluster::getClusterWithReplicasAsShards(const Settings & settings, size_t max_replicas_from_shard) const +std::unique_ptr Cluster::getClusterWithReplicasAsShards(const Settings & settings, size_t max_replicas_from_shard, size_t max_hosts) const { - return std::unique_ptr{ new Cluster(ReplicasAsShardsTag{}, *this, settings, max_replicas_from_shard)}; + return std::unique_ptr{ new Cluster(ReplicasAsShardsTag{}, *this, settings, max_replicas_from_shard, max_hosts)}; } std::unique_ptr Cluster::getClusterWithSingleShard(size_t index) const @@ -792,7 +792,7 @@ void shuffleReplicas(std::vector & replicas, const Settings & } -Cluster::Cluster(Cluster::ReplicasAsShardsTag, const Cluster & from, const Settings & settings, size_t max_replicas_from_shard) +Cluster::Cluster(Cluster::ReplicasAsShardsTag, const Cluster & from, const Settings & settings, size_t max_replicas_from_shard, size_t max_hosts) { if (from.addresses_with_failover.empty()) throw Exception(ErrorCodes::LOGICAL_ERROR, "Cluster is empty"); @@ -814,6 +814,7 @@ Cluster::Cluster(Cluster::ReplicasAsShardsTag, const Cluster & from, const Setti if (address.is_local) info.local_addresses.push_back(address); + addresses_with_failover.emplace_back(Addresses({address})); auto pool = ConnectionPoolFactory::instance().get( 
static_cast(settings[Setting::distributed_connections_pool_size]), @@ -837,9 +838,6 @@ Cluster::Cluster(Cluster::ReplicasAsShardsTag, const Cluster & from, const Setti info.per_replica_pools = {std::move(pool)}; info.default_database = address.default_database; - addresses_with_failover.emplace_back(Addresses{address}); - - slot_to_shard.insert(std::end(slot_to_shard), info.weight, shards_info.size()); shards_info.emplace_back(std::move(info)); } }; @@ -861,10 +859,37 @@ Cluster::Cluster(Cluster::ReplicasAsShardsTag, const Cluster & from, const Setti secret = from.secret; name = from.name; + constrainShardInfoAndAddressesToMaxHosts(max_hosts); + + for (size_t i = 0; i < shards_info.size(); ++i) + slot_to_shard.insert(std::end(slot_to_shard), shards_info[i].weight, i); + initMisc(); } +void Cluster::constrainShardInfoAndAddressesToMaxHosts(size_t max_hosts) +{ + if (max_hosts == 0 || shards_info.size() <= max_hosts) + return; + + pcg64_fast gen{randomSeed()}; + std::shuffle(shards_info.begin(), shards_info.end(), gen); + shards_info.resize(max_hosts); + + AddressesWithFailover addresses_with_failover_; + + UInt32 shard_num = 0; + for (auto & shard_info : shards_info) + { + addresses_with_failover_.push_back(addresses_with_failover[shard_info.shard_num - 1]); + shard_info.shard_num = ++shard_num; + } + + addresses_with_failover.swap(addresses_with_failover_); +} + + Cluster::Cluster(Cluster::SubclusterTag, const Cluster & from, const std::vector & indices) { for (size_t index : indices) diff --git a/src/Interpreters/Cluster.h b/src/Interpreters/Cluster.h index b5a4c51c11db..f9b581034ef7 100644 --- a/src/Interpreters/Cluster.h +++ b/src/Interpreters/Cluster.h @@ -270,7 +270,7 @@ class Cluster std::unique_ptr getClusterWithMultipleShards(const std::vector & indices) const; /// Get a new Cluster that contains all servers (all shards with all replicas) from existing cluster as independent shards. - std::unique_ptr getClusterWithReplicasAsShards(const Settings & settings, size_t max_replicas_from_shard = 0) const; + std::unique_ptr getClusterWithReplicasAsShards(const Settings & settings, size_t max_replicas_from_shard = 0, size_t max_hosts = 0) const; /// Returns false if cluster configuration doesn't allow to use it for cross-replication. /// NOTE: true does not mean, that it's actually a cross-replication cluster. 
@@ -296,7 +296,7 @@ class Cluster /// For getClusterWithReplicasAsShards implementation struct ReplicasAsShardsTag {}; - Cluster(ReplicasAsShardsTag, const Cluster & from, const Settings & settings, size_t max_replicas_from_shard); + Cluster(ReplicasAsShardsTag, const Cluster & from, const Settings & settings, size_t max_replicas_from_shard, size_t max_hosts); void addShard( const Settings & settings, @@ -308,6 +308,9 @@ class Cluster ShardInfoInsertPathForInternalReplication insert_paths = {}, bool internal_replication = false); + /// Reduce size of cluster to max_hosts + void constrainShardInfoAndAddressesToMaxHosts(size_t max_hosts); + /// Inter-server secret String secret; diff --git a/src/Interpreters/InterpreterCreateQuery.cpp b/src/Interpreters/InterpreterCreateQuery.cpp index 435aa65af41d..05e60f09224c 100644 --- a/src/Interpreters/InterpreterCreateQuery.cpp +++ b/src/Interpreters/InterpreterCreateQuery.cpp @@ -1991,8 +1991,7 @@ bool InterpreterCreateQuery::doCreateTable(ASTCreateQuery & create, auto table_function_ast = create.getChild(*create.as_table_function); auto table_function = TableFunctionFactory::instance().get(table_function_ast, getContext()); - if (!table_function->canBeUsedToCreateTable()) - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Table function '{}' cannot be used to create a table", table_function->getName()); + table_function->validateUseToCreateTable(); /// In case of CREATE AS table_function() query we should use global context /// in storage creation because there will be no query context on server startup diff --git a/src/Parsers/FunctionSecretArgumentsFinder.h b/src/Parsers/FunctionSecretArgumentsFinder.h index 8a3ef97422e8..847762631517 100644 --- a/src/Parsers/FunctionSecretArgumentsFinder.h +++ b/src/Parsers/FunctionSecretArgumentsFinder.h @@ -3,9 +3,12 @@ #include #include #include +#include +#include #include #include #include +#include namespace DB @@ -29,6 +32,21 @@ class AbstractFunction virtual ~Arguments() = default; virtual size_t size() const = 0; virtual std::unique_ptr at(size_t n) const = 0; + void skipArgument(size_t n) { skipped_indexes.insert(n); } + void unskipArguments() { skipped_indexes.clear(); } + size_t getRealIndex(size_t n) const + { + for (auto idx : skipped_indexes) + { + if (n < idx) + break; + ++n; + } + return n; + } + size_t skippedSize() const { return skipped_indexes.size(); } + private: + std::set skipped_indexes; }; virtual ~AbstractFunction() = default; @@ -77,14 +95,15 @@ class FunctionSecretArgumentsFinder { if (index >= function->arguments->size()) return; + auto real_index = function->arguments->getRealIndex(index); if (!result.count) { - result.start = index; + result.start = real_index; result.are_named = argument_is_named; } - chassert(index >= result.start); /// We always check arguments consecutively + chassert(real_index >= result.start); /// We always check arguments consecutively chassert(result.replacement.empty()); /// We shouldn't use replacement with masking other arguments - result.count = index + 1 - result.start; + result.count = real_index + 1 - result.start; if (!argument_is_named) result.are_named = false; } @@ -102,8 +121,12 @@ class FunctionSecretArgumentsFinder { findMongoDBSecretArguments(); } + else if (function->name() == "iceberg") + { + findIcebergFunctionSecretArguments(); + } else if ((function->name() == "s3") || (function->name() == "cosn") || (function->name() == "oss") || - (function->name() == "deltaLake") || (function->name() == "hudi") || (function->name() == "iceberg") || + 
(function->name() == "deltaLake") || (function->name() == "hudi") || (function->name() == "gcs") || (function->name() == "icebergS3") || (function->name() == "paimon") || (function->name() == "paimonS3")) { @@ -270,6 +293,12 @@ class FunctionSecretArgumentsFinder findSecretNamedArgument("secret_access_key", 1); return; } + if (is_cluster_function && isNamedCollectionName(1)) + { + /// s3Cluster(cluster, named_collection, ..., secret_access_key = 'secret_access_key', ...) + findSecretNamedArgument("secret_access_key", 2); + return; + } findSecretNamedArgument("secret_access_key", url_arg_idx); @@ -277,6 +306,7 @@ class FunctionSecretArgumentsFinder /// s3('url', NOSIGN, 'format' [, 'compression'] [, extra_credentials(..)] [, headers(..)]) /// s3('url', 'format', 'structure' [, 'compression'] [, extra_credentials(..)] [, headers(..)]) size_t count = excludeS3OrURLNestedMaps(); + if ((url_arg_idx + 3 <= count) && (count <= url_arg_idx + 4)) { String second_arg; @@ -341,6 +371,48 @@ class FunctionSecretArgumentsFinder markSecretArgument(url_arg_idx + 4); } + std::string findIcebergStorageType() + { + std::string storage_type = "s3"; + + size_t count = function->arguments->size(); + if (!count) + return storage_type; + + auto storage_type_idx = findNamedArgument(&storage_type, "storage_type"); + if (storage_type_idx != -1) + { + storage_type = Poco::toLower(storage_type); + function->arguments->skipArgument(storage_type_idx); + } + else if (isNamedCollectionName(0)) + { + std::string collection_name; + if (function->arguments->at(0)->tryGetString(&collection_name, true)) + { + NamedCollectionPtr collection = NamedCollectionFactory::instance().tryGet(collection_name); + if (collection && collection->has("storage_type")) + { + storage_type = Poco::toLower(collection->get("storage_type")); + } + } + } + + return storage_type; + } + + void findIcebergFunctionSecretArguments() + { + auto storage_type = findIcebergStorageType(); + + if (storage_type == "s3") + findS3FunctionSecretArguments(false); + else if (storage_type == "azure") + findAzureBlobStorageFunctionSecretArguments(false); + + function->arguments->unskipArguments(); + } + bool maskAzureConnectionString(ssize_t url_arg_idx, bool argument_is_named = false, size_t start = 0) { String url_arg; @@ -364,7 +436,7 @@ class FunctionSecretArgumentsFinder if (RE2::Replace(&url_arg, account_key_pattern, "AccountKey=[HIDDEN]\\1")) { chassert(result.count == 0); /// We shouldn't use replacement with masking other arguments - result.start = url_arg_idx; + result.start = function->arguments->getRealIndex(url_arg_idx); result.are_named = argument_is_named; result.count = 1; result.replacement = url_arg; @@ -534,6 +606,7 @@ class FunctionSecretArgumentsFinder void findTableEngineSecretArguments() { const String & engine_name = function->name(); + if (engine_name == "ExternalDistributed") { /// ExternalDistributed('engine', 'host:port', 'database', 'table', 'user', 'password') @@ -551,10 +624,13 @@ class FunctionSecretArgumentsFinder { findMongoDBSecretArguments(); } + else if (engine_name == "Iceberg") + { + findIcebergTableEngineSecretArguments(); + } else if ((engine_name == "S3") || (engine_name == "COSN") || (engine_name == "OSS") || (engine_name == "DeltaLake") || (engine_name == "Hudi") - || (engine_name == "Iceberg") || (engine_name == "IcebergS3") - || (engine_name == "S3Queue")) + || (engine_name == "IcebergS3") || (engine_name == "S3Queue")) { /// S3('url', ['aws_access_key_id', 'aws_secret_access_key',] ...) 
findS3TableEngineSecretArguments(); } else if (engine_name == "URL") { findURLSecretArguments(); } - else if (engine_name == "AzureBlobStorage" || engine_name == "AzureQueue") + else if (engine_name == "AzureBlobStorage" || engine_name == "AzureQueue" || engine_name == "IcebergAzure") { findAzureBlobStorageTableEngineSecretArguments(); } @@ -681,6 +757,18 @@ class FunctionSecretArgumentsFinder markSecretArgument(2); } + void findIcebergTableEngineSecretArguments() + { + auto storage_type = findIcebergStorageType(); + + if (storage_type == "s3") + findS3TableEngineSecretArguments(); + else if (storage_type == "azure") + findAzureBlobStorageTableEngineSecretArguments(); + + function->arguments->unskipArguments(); + } + void findDatabaseEngineSecretArguments() { const String & engine_name = function->name(); diff --git a/src/Parsers/FunctionSecretArgumentsFinderAST.h b/src/Parsers/FunctionSecretArgumentsFinderAST.h index a260c0d58da6..3624d7a7e87b 100644 --- a/src/Parsers/FunctionSecretArgumentsFinderAST.h +++ b/src/Parsers/FunctionSecretArgumentsFinderAST.h @@ -54,10 +54,13 @@ class FunctionAST : public AbstractFunction { public: explicit ArgumentsAST(const ASTs * arguments_) : arguments(arguments_) {} - size_t size() const override { return arguments ? arguments->size() : 0; } + size_t size() const override + { /// size without skipped indexes + return arguments ? arguments->size() - skippedSize() : 0; + } std::unique_ptr at(size_t n) const override - { - return std::make_unique(arguments->at(n).get()); + { /// n is a relative index; some indexes can be skipped + return std::make_unique(arguments->at(getRealIndex(n)).get()); } private: const ASTs * arguments = nullptr; diff --git a/src/Server/TCPHandler.cpp b/src/Server/TCPHandler.cpp index 05fdfdd997b7..391a0f3e271e 100644 --- a/src/Server/TCPHandler.cpp +++ b/src/Server/TCPHandler.cpp @@ -23,6 +23,7 @@ #include #include #include +#include #include #include #include @@ -34,7 +35,6 @@ #include #include #include -#include #include #include #include diff --git a/src/Storages/HivePartitioningUtils.cpp b/src/Storages/HivePartitioningUtils.cpp index 86084717dd8e..060f04474e98 100644 --- a/src/Storages/HivePartitioningUtils.cpp +++ b/src/Storages/HivePartitioningUtils.cpp @@ -210,9 +210,9 @@ HivePartitionColumnsWithFileColumnsPair setupHivePartitioningForObjectStorage( * Otherwise, in case `use_hive_partitioning=1`, we can keep the old behavior of extracting it from the sample path.
* And if the schema was inferred (not specified in the table definition), we need to enrich it with the path partition columns */ - if (configuration->partition_strategy && configuration->partition_strategy_type == PartitionStrategyFactory::StrategyType::HIVE) + if (configuration->getPartitionStrategy() && configuration->getPartitionStrategyType() == PartitionStrategyFactory::StrategyType::HIVE) { - hive_partition_columns_to_read_from_file_path = configuration->partition_strategy->getPartitionColumns(); + hive_partition_columns_to_read_from_file_path = configuration->getPartitionStrategy()->getPartitionColumns(); sanityCheckSchemaAndHivePartitionColumns(hive_partition_columns_to_read_from_file_path, columns, /* check_contained_in_schema */true); } else if (context->getSettingsRef()[Setting::use_hive_partitioning]) @@ -226,7 +226,7 @@ HivePartitionColumnsWithFileColumnsPair setupHivePartitioningForObjectStorage( sanityCheckSchemaAndHivePartitionColumns(hive_partition_columns_to_read_from_file_path, columns, /* check_contained_in_schema */false); } - if (configuration->partition_columns_in_data_file) + if (configuration->getPartitionColumnsInDataFile()) { file_columns = columns.getAllPhysical(); } diff --git a/src/Storages/IStorage.h b/src/Storages/IStorage.h index 96f5adbc2de5..7179dbbfa8ee 100644 --- a/src/Storages/IStorage.h +++ b/src/Storages/IStorage.h @@ -71,6 +71,9 @@ using ConditionSelectivityEstimatorPtr = std::shared_ptr; + class ActionsDAG; /** Storage. Describes the table. Responsible for diff --git a/src/Storages/IStorageCluster.cpp b/src/Storages/IStorageCluster.cpp index c6c69c0f21bc..b49f13435c0e 100644 --- a/src/Storages/IStorageCluster.cpp +++ b/src/Storages/IStorageCluster.cpp @@ -37,6 +37,12 @@ namespace Setting extern const SettingsBool parallel_replicas_local_plan; extern const SettingsString cluster_for_parallel_replicas; extern const SettingsNonZeroUInt64 max_parallel_replicas; + extern const SettingsUInt64 object_storage_max_nodes; +} + +namespace ErrorCodes +{ + extern const int NOT_IMPLEMENTED; } namespace ErrorCodes @@ -131,15 +137,23 @@ void IStorageCluster::read( SelectQueryInfo & query_info, ContextPtr context, QueryProcessingStage::Enum processed_stage, - size_t /*max_block_size*/, - size_t /*num_streams*/) + size_t max_block_size, + size_t num_streams) { + auto cluster_name_from_settings = getClusterName(context); + + if (cluster_name_from_settings.empty()) + { + readFallBackToPure(query_plan, column_names, storage_snapshot, query_info, context, processed_stage, max_block_size, num_streams); + return; + } + updateConfigurationIfNeeded(context); storage_snapshot->check(column_names); updateBeforeRead(context); - auto cluster = getCluster(context); + auto cluster = getClusterImpl(context, cluster_name_from_settings, context->getSettingsRef()[Setting::object_storage_max_nodes]); /// Calculate the header. 
This is significant, because some columns could be thrown away in some cases like query with count(*) @@ -186,6 +200,20 @@ void IStorageCluster::read( query_plan.addStep(std::move(reading)); } +SinkToStoragePtr IStorageCluster::write( + const ASTPtr & query, + const StorageMetadataPtr & metadata_snapshot, + ContextPtr context, + bool async_insert) +{ + auto cluster_name_from_settings = getClusterName(context); + + if (cluster_name_from_settings.empty()) + return writeFallBackToPure(query, metadata_snapshot, context, async_insert); + + throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method write is not supported by storage {}", getName()); +} + void ReadFromCluster::initializePipeline(QueryPipelineBuilder & pipeline, const BuildQueryPipelineSettings &) { const Scalars & scalars = context->hasQueryContext() ? context->getQueryContext()->getScalars() : Scalars{}; @@ -278,9 +306,9 @@ ContextPtr ReadFromCluster::updateSettings(const Settings & settings) return new_context; } -ClusterPtr IStorageCluster::getCluster(ContextPtr context) const +ClusterPtr IStorageCluster::getClusterImpl(ContextPtr context, const String & cluster_name_, size_t max_hosts) { - return context->getCluster(cluster_name)->getClusterWithReplicasAsShards(context->getSettingsRef()); + return context->getCluster(cluster_name_)->getClusterWithReplicasAsShards(context->getSettingsRef(), /* max_replicas_from_shard */ 0, max_hosts); } } diff --git a/src/Storages/IStorageCluster.h b/src/Storages/IStorageCluster.h index 3248b26b8c5e..d63d9f597453 100644 --- a/src/Storages/IStorageCluster.h +++ b/src/Storages/IStorageCluster.h @@ -30,10 +30,16 @@ class IStorageCluster : public IStorage SelectQueryInfo & query_info, ContextPtr context, QueryProcessingStage::Enum processed_stage, - size_t /*max_block_size*/, - size_t /*num_streams*/) override; + size_t max_block_size, + size_t num_streams) override; - ClusterPtr getCluster(ContextPtr context) const; + SinkToStoragePtr write( + const ASTPtr & query, + const StorageMetadataPtr & metadata_snapshot, + ContextPtr context, + bool async_insert) override; + + ClusterPtr getCluster(ContextPtr context) const { return getClusterImpl(context, cluster_name); } /// Query is needed for pruning by virtual columns (_file, _path) virtual RemoteQueryExecutor::Extension getTaskIteratorExtension( @@ -51,13 +57,39 @@ class IStorageCluster : public IStorage bool supportsOptimizationToSubcolumns() const override { return false; } bool supportsTrivialCountOptimization(const StorageSnapshotPtr &, ContextPtr) const override { return true; } + const String & getOriginalClusterName() const { return cluster_name; } + virtual String getClusterName(ContextPtr /* context */) const { return getOriginalClusterName(); } + protected: virtual void updateBeforeRead(const ContextPtr &) {} virtual void updateQueryToSendIfNeeded(ASTPtr & /*query*/, const StorageSnapshotPtr & /*storage_snapshot*/, const ContextPtr & /*context*/) {} virtual void updateConfigurationIfNeeded(ContextPtr /* context */) {} + virtual void readFallBackToPure( + QueryPlan & /* query_plan */, + const Names & /* column_names */, + const StorageSnapshotPtr & /* storage_snapshot */, + SelectQueryInfo & /* query_info */, + ContextPtr /* context */, + QueryProcessingStage::Enum /* processed_stage */, + size_t /* max_block_size */, + size_t /* num_streams */) + { + throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method readFallBackToPure is not supported by storage {}", getName()); + } + + virtual SinkToStoragePtr writeFallBackToPure( + const ASTPtr & /*query*/, 
+ const StorageMetadataPtr & /*metadata_snapshot*/, + ContextPtr /*context*/, + bool /*async_insert*/) + { + throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method writeFallBackToPure is not supported by storage {}", getName()); + } private: + static ClusterPtr getClusterImpl(ContextPtr context, const String & cluster_name_, size_t max_hosts = 0); + LoggerPtr log; String cluster_name; }; diff --git a/src/Storages/ObjectStorage/Azure/Configuration.cpp b/src/Storages/ObjectStorage/Azure/Configuration.cpp index 2a612579445b..b8b1ccc3781e 100644 --- a/src/Storages/ObjectStorage/Azure/Configuration.cpp +++ b/src/Storages/ObjectStorage/Azure/Configuration.cpp @@ -65,6 +65,7 @@ const std::unordered_set optional_configuration_keys = { "partition_columns_in_data_file", "client_id", "tenant_id", + "storage_type", }; void StorageAzureConfiguration::check(ContextPtr context) @@ -208,10 +209,6 @@ void AzureStorageParsedArguments::fromNamedCollection(const NamedCollection & co String connection_url; String container_name; - std::optional account_name; - std::optional account_key; - std::optional client_id; - std::optional tenant_id; if (collection.has("connection_string")) connection_url = collection.get("connection_string"); @@ -392,16 +389,10 @@ void AzureStorageParsedArguments::fromAST(ASTs & engine_args, ContextPtr context std::unordered_map engine_args_to_idx; - String connection_url = checkAndGetLiteralArgument(engine_args[0], "connection_string/storage_account_url"); String container_name = checkAndGetLiteralArgument(engine_args[1], "container"); blob_path = checkAndGetLiteralArgument(engine_args[2], "blobpath"); - std::optional account_name; - std::optional account_key; - std::optional client_id; - std::optional tenant_id; - collectCredentials(extra_credentials, client_id, tenant_id, context); auto is_format_arg = [] (const std::string & s) -> bool @@ -451,8 +442,7 @@ void AzureStorageParsedArguments::fromAST(ASTs & engine_args, ContextPtr context auto sixth_arg = checkAndGetLiteralArgument(engine_args[5], "partition_strategy/structure"); if (magic_enum::enum_contains(sixth_arg, magic_enum::case_insensitive)) { - partition_strategy_type - = magic_enum::enum_cast(sixth_arg, magic_enum::case_insensitive).value(); + partition_strategy_type = magic_enum::enum_cast(sixth_arg, magic_enum::case_insensitive).value(); } else { @@ -572,8 +562,7 @@ void AzureStorageParsedArguments::fromAST(ASTs & engine_args, ContextPtr context auto eighth_arg = checkAndGetLiteralArgument(engine_args[7], "partition_strategy/structure"); if (magic_enum::enum_contains(eighth_arg, magic_enum::case_insensitive)) { - partition_strategy_type - = magic_enum::enum_cast(eighth_arg, magic_enum::case_insensitive).value(); + partition_strategy_type = magic_enum::enum_cast(eighth_arg, magic_enum::case_insensitive).value(); } else { @@ -825,6 +814,26 @@ void StorageAzureConfiguration::initializeFromParsedArguments(const AzureStorage StorageObjectStorageConfiguration::initializeFromParsedArguments(parsed_arguments); blob_path = parsed_arguments.blob_path; connection_params = parsed_arguments.connection_params; + account_name = parsed_arguments.account_name; + account_key = parsed_arguments.account_key; + client_id = parsed_arguments.client_id; + tenant_id = parsed_arguments.tenant_id; +} + +ASTPtr StorageAzureConfiguration::createArgsWithAccessData() const +{ + auto arguments = make_intrusive(); + + arguments->children.push_back(make_intrusive(connection_params.endpoint.storage_account_url)); + 
arguments->children.push_back(make_intrusive(connection_params.endpoint.container_name)); + arguments->children.push_back(make_intrusive(blob_path.path)); + if (account_name && account_key) + { + arguments->children.push_back(make_intrusive(*account_name)); + arguments->children.push_back(make_intrusive(*account_key)); + } + + return arguments; } void StorageAzureConfiguration::addStructureAndFormatToArgsIfNeeded( @@ -832,13 +841,13 @@ void StorageAzureConfiguration::addStructureAndFormatToArgsIfNeeded( { if (disk) { - if (format == "auto") + if (getFormat() == "auto") { ASTs format_equal_func_args = {make_intrusive("format"), make_intrusive(format_)}; auto format_equal_func = makeASTFunction("equals", std::move(format_equal_func_args)); args.push_back(format_equal_func); } - if (structure == "auto") + if (getStructure() == "auto") { ASTs structure_equal_func_args = {make_intrusive("structure"), make_intrusive(structure_)}; auto structure_equal_func = makeASTFunction("equals", std::move(structure_equal_func_args)); diff --git a/src/Storages/ObjectStorage/Azure/Configuration.h b/src/Storages/ObjectStorage/Azure/Configuration.h index 61618e3b8340..0bdef02a11f6 100644 --- a/src/Storages/ObjectStorage/Azure/Configuration.h +++ b/src/Storages/ObjectStorage/Azure/Configuration.h @@ -76,6 +76,11 @@ struct AzureStorageParsedArguments : private StorageParsedArguments Path blob_path; AzureBlobStorage::ConnectionParams connection_params; + + std::optional account_name; + std::optional account_key; + std::optional client_id; + std::optional tenant_id; }; class StorageAzureConfiguration : public StorageObjectStorageConfiguration @@ -124,6 +129,7 @@ class StorageAzureConfiguration : public StorageObjectStorageConfiguration onelake_client_secret = client_secret_; onelake_tenant_id = tenant_id_; } + ASTPtr createArgsWithAccessData() const override; protected: void fromDisk(const String & disk_name, ASTs & args, ContextPtr context, bool with_structure) override; @@ -135,14 +141,21 @@ class StorageAzureConfiguration : public StorageObjectStorageConfiguration Path blob_path; Paths blobs_paths; AzureBlobStorage::ConnectionParams connection_params; - DiskPtr disk; + + std::optional account_name; + std::optional account_key; + std::optional client_id; + std::optional tenant_id; String onelake_client_id; String onelake_client_secret; String onelake_tenant_id; + DiskPtr disk; + void initializeFromParsedArguments(const AzureStorageParsedArguments & parsed_arguments); }; + } #endif diff --git a/src/Storages/ObjectStorage/DataLakes/DataLakeConfiguration.h b/src/Storages/ObjectStorage/DataLakes/DataLakeConfiguration.h index 0dc4e6b7653d..80fc5c4e2cad 100644 --- a/src/Storages/ObjectStorage/DataLakes/DataLakeConfiguration.h +++ b/src/Storages/ObjectStorage/DataLakes/DataLakeConfiguration.h @@ -2,6 +2,7 @@ #include "config.h" #include +#include #include #include #include @@ -12,11 +13,16 @@ #include #include #include -#include +#include #include #include #include #include +#include +#include +#include +#include + #include #include @@ -124,13 +130,13 @@ class DataLakeConfiguration : public BaseStorageConfiguration, public std::enabl bool supportsDelete() const override { - assertInitialized(); + assertInitializedDL(); return current_metadata->supportsDelete(); } bool supportsParallelInsert() const override { - assertInitialized(); + assertInitializedDL(); return current_metadata->supportsParallelInsert(); } @@ -141,25 +147,25 @@ class DataLakeConfiguration : public BaseStorageConfiguration, public std::enabl 
std::shared_ptr catalog, const std::optional & format_settings) override { - assertInitialized(); + assertInitializedDL(); current_metadata->mutate(commands, shared_from_this(), context, storage_id, metadata_snapshot, catalog, format_settings); } void checkMutationIsPossible(const MutationCommands & commands) override { - assertInitialized(); + assertInitializedDL(); current_metadata->checkMutationIsPossible(commands); } void checkAlterIsPossible(const AlterCommands & commands) override { - assertInitialized(); + assertInitializedDL(); current_metadata->checkAlterIsPossible(commands); } void alter(const AlterCommands & params, ContextPtr context) override { - assertInitialized(); + assertInitializedDL(); current_metadata->alter(params, context); } @@ -173,7 +179,7 @@ class DataLakeConfiguration : public BaseStorageConfiguration, public std::enabl std::optional tryGetTableStructureFromMetadata(ContextPtr local_context) const override { - assertInitialized(); + assertInitializedDL(); if (auto schema = current_metadata->getTableSchema(local_context); !schema.empty()) return ColumnsDescription(std::move(schema)); return std::nullopt; @@ -181,37 +187,37 @@ class DataLakeConfiguration : public BaseStorageConfiguration, public std::enabl std::optional totalRows(ContextPtr local_context) override { - assertInitialized(); + assertInitializedDL(); return current_metadata->totalRows(local_context); } std::optional totalBytes(ContextPtr local_context) override { - assertInitialized(); + assertInitializedDL(); return current_metadata->totalBytes(local_context); } bool isDataSortedBySortingKey(StorageMetadataPtr metadata_snapshot, ContextPtr local_context) const override { - assertInitialized(); + assertInitializedDL(); return current_metadata->isDataSortedBySortingKey(metadata_snapshot, local_context); } std::shared_ptr getInitialSchemaByPath(ContextPtr local_context, ObjectInfoPtr object_info) const override { - assertInitialized(); + assertInitializedDL(); return current_metadata->getInitialSchemaByPath(local_context, object_info); } std::shared_ptr getSchemaTransformer(ContextPtr local_context, ObjectInfoPtr object_info) const override { - assertInitialized(); + assertInitializedDL(); return current_metadata->getSchemaTransformer(local_context, object_info); } StorageInMemoryMetadata getStorageSnapshotMetadata(ContextPtr context) const override { - assertInitialized(); + assertInitializedDL(); return current_metadata->getStorageSnapshotMetadata(context); } @@ -226,7 +232,7 @@ class DataLakeConfiguration : public BaseStorageConfiguration, public std::enabl IDataLakeMetadata * getExternalMetadata() override { - assertInitialized(); + assertInitializedDL(); return current_metadata.get(); } @@ -234,7 +240,7 @@ class DataLakeConfiguration : public BaseStorageConfiguration, public std::enabl bool supportsWrites() const override { - assertInitialized(); + assertInitializedDL(); return current_metadata->supportsWrites(); } @@ -245,7 +251,7 @@ class DataLakeConfiguration : public BaseStorageConfiguration, public std::enabl StorageMetadataPtr storage_metadata, ContextPtr context) override { - assertInitialized(); + assertInitializedDL(); return current_metadata->iterate(filter_dag, callback, list_batch_size, storage_metadata, context); } @@ -257,7 +263,7 @@ class DataLakeConfiguration : public BaseStorageConfiguration, public std::enabl /// because the code will be removed ASAP anyway) DeltaLakePartitionColumns getDeltaLakePartitionColumns() const { - assertInitialized(); + assertInitializedDL(); const auto * 
delta_lake_metadata = dynamic_cast(current_metadata.get()); if (delta_lake_metadata) return delta_lake_metadata->getPartitionColumns(); @@ -267,18 +273,18 @@ class DataLakeConfiguration : public BaseStorageConfiguration, public std::enabl void modifyFormatSettings(FormatSettings & settings_, const Context & local_context) const override { - assertInitialized(); + assertInitializedDL(); current_metadata->modifyFormatSettings(settings_, local_context); } ColumnMapperPtr getColumnMapperForObject(ObjectInfoPtr object_info) const override { - assertInitialized(); + assertInitializedDL(); return current_metadata->getColumnMapperForObject(object_info); } ColumnMapperPtr getColumnMapperForCurrentSchema(StorageMetadataPtr storage_metadata_snapshot, ContextPtr context) const override { - assertInitialized(); + assertInitializedDL(); return current_metadata->getColumnMapperForCurrentSchema(storage_metadata_snapshot, context); } @@ -347,7 +353,7 @@ class DataLakeConfiguration : public BaseStorageConfiguration, public std::enabl bool optimize(const StorageMetadataPtr & metadata_snapshot, ContextPtr context, const std::optional & format_settings) override { - assertInitialized(); + assertInitializedDL(); return current_metadata->optimize(metadata_snapshot, context, format_settings); } @@ -372,8 +378,9 @@ class DataLakeConfiguration : public BaseStorageConfiguration, public std::enabl const DataLakeStorageSettingsPtr settings; ObjectStoragePtr ready_object_storage; - void assertInitialized() const + void assertInitializedDL() const { + BaseStorageConfiguration::assertInitialized(); if (!current_metadata) throw Exception(ErrorCodes::LOGICAL_ERROR, "Metadata is not initialized"); } @@ -406,18 +413,361 @@ using StorageS3IcebergConfiguration = DataLakeConfiguration; #endif -#if USE_AZURE_BLOB_STORAGE +# if USE_AZURE_BLOB_STORAGE using StorageAzureIcebergConfiguration = DataLakeConfiguration; using StorageAzurePaimonConfiguration = DataLakeConfiguration; #endif -#if USE_HDFS +# if USE_HDFS using StorageHDFSIcebergConfiguration = DataLakeConfiguration; using StorageHDFSPaimonConfiguration = DataLakeConfiguration; #endif using StorageLocalIcebergConfiguration = DataLakeConfiguration; using StorageLocalPaimonConfiguration = DataLakeConfiguration; + +/// Class detects storage type by `storage_type` parameter if exists +/// and uses appropriate implementation - S3, Azure, HDFS or Local +class StorageIcebergConfiguration : public StorageObjectStorageConfiguration, public std::enable_shared_from_this +{ + friend class StorageObjectStorageConfiguration; + +public: + explicit StorageIcebergConfiguration(DataLakeStorageSettingsPtr settings_) : settings(settings_) {} + + ObjectStorageType getType() const override { return getImpl().getType(); } + + std::string getTypeName() const override { return getImpl().getTypeName(); } + std::string getEngineName() const override { return getImpl().getEngineName(); } + std::string getNamespaceType() const override { return getImpl().getNamespaceType(); } + + Path getRawPath() const override { return getImpl().getRawPath(); } + const String & getRawURI() const override { return getImpl().getRawURI(); } + const Path & getPathForRead() const override { return getImpl().getPathForRead(); } + Path getPathForWrite(const std::string & partition_id) const override { return getImpl().getPathForWrite(partition_id); } + + void setPathForRead(const Path & path) override { getImpl().setPathForRead(path); } + + const Paths & getPaths() const override { return getImpl().getPaths(); } + void 
setPaths(const Paths & paths) override { getImpl().setPaths(paths); } + + String getDataSourceDescription() const override { return getImpl().getDataSourceDescription(); } + String getNamespace() const override { return getImpl().getNamespace(); } + + StorageObjectStorageQuerySettings getQuerySettings(const ContextPtr & context) const override + { return getImpl().getQuerySettings(context); } + + void addStructureAndFormatToArgsIfNeeded( + ASTs & args, const String & structure_, const String & format_, ContextPtr context, bool with_structure) override + { getImpl().addStructureAndFormatToArgsIfNeeded(args, structure_, format_, context, with_structure); } + + bool isNamespaceWithGlobs() const override { return getImpl().isNamespaceWithGlobs(); } + + bool isArchive() const override { return getImpl().isArchive(); } + bool isPathInArchiveWithGlobs() const override { return getImpl().isPathInArchiveWithGlobs(); } + std::string getPathInArchive() const override { return getImpl().getPathInArchive(); } + + void check(ContextPtr context) override { getImpl().check(context); } + void validateNamespace(const String & name) const override { getImpl().validateNamespace(name); } + + ObjectStoragePtr createObjectStorage(ContextPtr context, bool is_readonly) override + { return getImpl().createObjectStorage(context, is_readonly); } + bool isStaticConfiguration() const override { return getImpl().isStaticConfiguration(); } + + bool isDataLakeConfiguration() const override { return getImpl().isDataLakeConfiguration(); } + + std::optional totalRows(ContextPtr context) override { return getImpl().totalRows(context); } + std::optional totalBytes(ContextPtr context) override { return getImpl().totalBytes(context); } + + IDataLakeMetadata * getExternalMetadata() override { return getImpl().getExternalMetadata(); } + + std::shared_ptr getInitialSchemaByPath(ContextPtr context, ObjectInfoPtr object_info) const override + { return getImpl().getInitialSchemaByPath(context, object_info); } + + std::shared_ptr getSchemaTransformer(ContextPtr context, ObjectInfoPtr object_info) const override + { return getImpl().getSchemaTransformer(context, object_info); } + + void modifyFormatSettings(FormatSettings & settings_, const Context & context) const override + { getImpl().modifyFormatSettings(settings_, context); } + + void addDeleteTransformers( + ObjectInfoPtr object_info, + QueryPipelineBuilder & builder, + const std::optional & format_settings, + FormatParserSharedResourcesPtr parser_shared_resources, + ContextPtr local_context) const override + { getImpl().addDeleteTransformers(object_info, builder, format_settings, parser_shared_resources, local_context); } + + ReadFromFormatInfo prepareReadingFromFormat( + ObjectStoragePtr object_storage, + const Strings & requested_columns, + const StorageSnapshotPtr & storage_snapshot, + bool supports_subset_of_columns, + bool supports_tuple_elements, + ContextPtr local_context, + const PrepareReadingFromFormatHiveParams & hive_parameters) override + { + return getImpl().prepareReadingFromFormat( + object_storage, + requested_columns, + storage_snapshot, + supports_subset_of_columns, + supports_tuple_elements, + local_context, + hive_parameters); + } + + void initPartitionStrategy(ASTPtr partition_by, const ColumnsDescription & columns, ContextPtr context) override + { getImpl().initPartitionStrategy(partition_by, columns, context); } + + std::optional tryGetTableStructureFromMetadata(ContextPtr local_context) const override + { return 
getImpl().tryGetTableStructureFromMetadata(local_context); } + + bool supportsFileIterator() const override { return getImpl().supportsFileIterator(); } + bool supportsWrites() const override { return getImpl().supportsWrites(); } + + bool supportsPartialPathPrefix() const override { return getImpl().supportsPartialPathPrefix(); } + + ObjectIterator iterate( + const ActionsDAG * filter_dag, + IDataLakeMetadata::FileProgressCallback callback, + size_t list_batch_size, + StorageMetadataPtr storage_metadata, + ContextPtr context) override + { + return getImpl().iterate(filter_dag, callback, list_batch_size, storage_metadata, context); + } + + void update( + ObjectStoragePtr object_storage_ptr, + ContextPtr context, + bool if_not_updated_before) override + { + getImpl().update(object_storage_ptr, context, if_not_updated_before); + } + + void create( + ObjectStoragePtr object_storage, + ContextPtr local_context, + const std::optional & columns, + ASTPtr partition_by, + ASTPtr order_by, + bool if_not_exists, + std::shared_ptr catalog, + const StorageID & table_id_) override + { + getImpl().create(object_storage, local_context, columns, partition_by, order_by, if_not_exists, catalog, table_id_); + } + + SinkToStoragePtr write( + SharedHeader sample_block, + const StorageID & table_id, + ObjectStoragePtr object_storage, + const std::optional & format_settings, + ContextPtr context, + std::shared_ptr catalog) override + { + return getImpl().write(sample_block, table_id, object_storage, format_settings, context, catalog); + } + + bool supportsDelete() const override { return getImpl().supportsDelete(); } + void mutate(const MutationCommands & commands, + ContextPtr context, + const StorageID & storage_id, + StorageMetadataPtr metadata_snapshot, + std::shared_ptr catalog, + const std::optional & format_settings) override + { + getImpl().mutate(commands, context, storage_id, metadata_snapshot, catalog, format_settings); + } + + void checkMutationIsPossible(const MutationCommands & commands) override { getImpl().checkMutationIsPossible(commands); } + + void checkAlterIsPossible(const AlterCommands & commands) override { getImpl().checkAlterIsPossible(commands); } + + void alter(const AlterCommands & params, ContextPtr context) override { getImpl().alter(params, context); } + + const DataLakeStorageSettings & getDataLakeSettings() const override { return getImpl().getDataLakeSettings(); } + + void initialize( + ASTs & engine_args, + ContextPtr local_context, + bool with_table_structure) override + { + createDynamicConfiguration(engine_args, local_context); + getImpl().initialize(engine_args, local_context, with_table_structure); + } + + ASTPtr createArgsWithAccessData() const override + { + return getImpl().createArgsWithAccessData(); + } + + void fromNamedCollection(const NamedCollection & collection, ContextPtr context) override + { getImpl().fromNamedCollection(collection, context); } + void fromAST(ASTs & args, ContextPtr context, bool with_structure) override + { getImpl().fromAST(args, context, with_structure); } + + const String & getFormat() const override { return getImpl().getFormat(); } + const String & getCompressionMethod() const override { return getImpl().getCompressionMethod(); } + const String & getStructure() const override { return getImpl().getStructure(); } + + PartitionStrategyFactory::StrategyType getPartitionStrategyType() const override { return getImpl().getPartitionStrategyType(); } + bool getPartitionColumnsInDataFile() const override { return 
getImpl().getPartitionColumnsInDataFile(); } + std::shared_ptr getPartitionStrategy() const override { return getImpl().getPartitionStrategy(); } + + void setFormat(const String & format_) override { getImpl().setFormat(format_); } + void setCompressionMethod(const String & compression_method_) override { getImpl().setCompressionMethod(compression_method_); } + void setStructure(const String & structure_) override { getImpl().setStructure(structure_); } + + void setPartitionStrategyType(PartitionStrategyFactory::StrategyType partition_strategy_type_) override + { getImpl().setPartitionStrategyType(partition_strategy_type_); } + void setPartitionColumnsInDataFile(bool partition_columns_in_data_file_) override + { getImpl().setPartitionColumnsInDataFile(partition_columns_in_data_file_); } + void setPartitionStrategy(const std::shared_ptr & partition_strategy_) override + { getImpl().setPartitionStrategy(partition_strategy_); } + + ColumnMapperPtr getColumnMapperForObject(ObjectInfoPtr obj) const override { return getImpl().getColumnMapperForObject(obj); } + + ColumnMapperPtr getColumnMapperForCurrentSchema(StorageMetadataPtr storage_metadata_snapshot, ContextPtr context) const override + { return getImpl().getColumnMapperForCurrentSchema(storage_metadata_snapshot, context); } + + std::shared_ptr getCatalog(ContextPtr context, bool is_attach) const override + { return getImpl().getCatalog(context, is_attach); } + + bool optimize(const StorageMetadataPtr & metadata_snapshot, ContextPtr context, const std::optional & format_settings) override + { return getImpl().optimize(metadata_snapshot, context, format_settings); } + + StorageInMemoryMetadata getStorageSnapshotMetadata(ContextPtr local_context) const override + { return getImpl().getStorageSnapshotMetadata(local_context); } + +protected: + /// Find storage_type argument and remove it from args if exists. + /// Return storage type. 
+ ObjectStorageType extractDynamicStorageType(ASTs & args, ContextPtr context, ASTPtr * type_arg) const override + { + static const auto * const storage_type_name = "storage_type"; + + if (auto named_collection = tryGetNamedCollectionWithOverrides(args, context)) + { + if (named_collection->has(storage_type_name)) + { + return objectStorageTypeFromString(named_collection->get(storage_type_name)); + } + } + + auto type_it = args.end(); + + /// S3 by default for backward compatibility + /// Iceberg without storage_type == IcebergS3 + ObjectStorageType type = ObjectStorageType::S3; + + for (auto arg_it = args.begin(); arg_it != args.end(); ++arg_it) + { + const auto * type_ast_function = (*arg_it)->as(); + + if (type_ast_function && type_ast_function->name == "equals" + && type_ast_function->arguments && type_ast_function->arguments->children.size() == 2) + { + auto * name = type_ast_function->arguments->children[0]->as(); + + if (name && name->name() == storage_type_name) + { + if (type_it != args.end()) + { + throw Exception( + ErrorCodes::BAD_ARGUMENTS, + "DataLake can have only one key-value argument: storage_type='type'."); + } + + auto * value = type_ast_function->arguments->children[1]->as(); + + if (!value) + { + throw Exception( + ErrorCodes::BAD_ARGUMENTS, + "DataLake parameter 'storage_type' has wrong type, string literal expected."); + } + + if (value->value.getType() != Field::Types::String) + { + throw Exception( + ErrorCodes::BAD_ARGUMENTS, + "DataLake parameter 'storage_type' has wrong value type, string expected."); + } + + type = objectStorageTypeFromString(value->value.safeGet()); + + type_it = arg_it; + } + } + } + + if (type_it != args.end()) + { + if (type_arg) + *type_arg = *type_it; + args.erase(type_it); + } + + return type; + } + + void createDynamicConfiguration(ASTs & args, ContextPtr context) + { + ObjectStorageType type = extractDynamicStorageType(args, context, nullptr); + createDynamicStorage(type); + } + + void assertInitialized() const override { getImpl().assertInitialized(); } + +private: + inline StorageObjectStorageConfiguration & getImpl() const + { + if (!impl) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Dynamic DataLake storage not initialized"); + + return *impl; + } + + void createDynamicStorage(ObjectStorageType type) + { + if (impl) + { + if (impl->getType() == type) + return; + + throw Exception(ErrorCodes::LOGICAL_ERROR, "Can't change datalake engine storage"); + } + + switch (type) + { +# if USE_AWS_S3 + case ObjectStorageType::S3: + impl = std::make_unique(settings); + break; +# endif +# if USE_AZURE_BLOB_STORAGE + case ObjectStorageType::Azure: + impl = std::make_unique(settings); + break; +# endif +# if USE_HDFS + case ObjectStorageType::HDFS: + impl = std::make_unique(settings); + break; +# endif + case ObjectStorageType::Local: + impl = std::make_unique(settings); + break; + default: + throw Exception(ErrorCodes::LOGICAL_ERROR, "Unsuported DataLake storage {}", type); + } + } + + StorageObjectStorageConfigurationPtr impl; + DataLakeStorageSettingsPtr settings; +}; #endif #if USE_PARQUET diff --git a/src/Storages/ObjectStorage/DataLakes/DataLakeStorageSettings.h b/src/Storages/ObjectStorage/DataLakes/DataLakeStorageSettings.h index 3d6ad55544af..f5e9019eada4 100644 --- a/src/Storages/ObjectStorage/DataLakes/DataLakeStorageSettings.h +++ b/src/Storages/ObjectStorage/DataLakes/DataLakeStorageSettings.h @@ -57,6 +57,9 @@ If enabled, the engine would use the metadata file with the most recent last_upd )", 0) \ DECLARE(Bool, 
iceberg_use_version_hint, false, R"( Get latest metadata path from version-hint.text file. +)", 0) \ + DECLARE(String, object_storage_cluster, "", R"( +Cluster for distributed requests )", 0) \ DECLARE(NonZeroUInt64, iceberg_format_version, 2, R"( Metadata format version. diff --git a/src/Storages/ObjectStorage/DataLakes/DeltaLakeMetadataDeltaKernel.cpp b/src/Storages/ObjectStorage/DataLakes/DeltaLakeMetadataDeltaKernel.cpp index c2ed2aac95b2..bdda2508d339 100644 --- a/src/Storages/ObjectStorage/DataLakes/DeltaLakeMetadataDeltaKernel.cpp +++ b/src/Storages/ObjectStorage/DataLakes/DeltaLakeMetadataDeltaKernel.cpp @@ -86,7 +86,7 @@ DeltaLakeMetadataDeltaKernel::DeltaLakeMetadataDeltaKernel( object_storage, context, log)) - , format_name(configuration_.lock()->format) + , format_name(configuration_.lock()->getFormat()) { object_storage_common = object_storage; #ifdef DEBUG_OR_SANITIZER_BUILD @@ -406,8 +406,8 @@ SinkToStoragePtr DeltaLakeMetadataDeltaKernel::write( context, sample_block, format_settings, - configuration->format, - configuration->compression_method); + configuration->getFormat(), + configuration->getCompressionMethod()); } return std::make_shared( @@ -417,8 +417,8 @@ SinkToStoragePtr DeltaLakeMetadataDeltaKernel::write( context, sample_block, format_settings, - configuration->format, - configuration->compression_method); + configuration->getFormat(), + configuration->getCompressionMethod()); } void DeltaLakeMetadataDeltaKernel::logMetadataFiles(ContextPtr context) const diff --git a/src/Storages/ObjectStorage/DataLakes/HudiMetadata.cpp b/src/Storages/ObjectStorage/DataLakes/HudiMetadata.cpp index 81fd17be94ac..cc33bdb0df49 100644 --- a/src/Storages/ObjectStorage/DataLakes/HudiMetadata.cpp +++ b/src/Storages/ObjectStorage/DataLakes/HudiMetadata.cpp @@ -89,7 +89,7 @@ HudiMetadata::HudiMetadata(ObjectStoragePtr object_storage_, StorageObjectStorag : WithContext(context_) , object_storage(object_storage_) , table_path(configuration_->getPathForRead().path) - , format(configuration_->format) + , format(configuration_->getFormat()) { } diff --git a/src/Storages/ObjectStorage/DataLakes/Iceberg/IcebergMetadata.cpp b/src/Storages/ObjectStorage/DataLakes/Iceberg/IcebergMetadata.cpp index 3ce0a2ee4838..2430da494142 100644 --- a/src/Storages/ObjectStorage/DataLakes/Iceberg/IcebergMetadata.cpp +++ b/src/Storages/ObjectStorage/DataLakes/Iceberg/IcebergMetadata.cpp @@ -202,7 +202,7 @@ IcebergMetadata::IcebergMetadata( , object_storage(std::move(object_storage_)) , persistent_components(initializePersistentTableComponents(configuration_, cache_ptr, context_)) , data_lake_settings(configuration_->getDataLakeSettings()) - , write_format(configuration_->format) + , write_format(configuration_->getFormat()) { } diff --git a/src/Storages/ObjectStorage/DataLakes/Iceberg/IcebergWrites.cpp b/src/Storages/ObjectStorage/DataLakes/Iceberg/IcebergWrites.cpp index 60aa4728d126..3809dfcd38c2 100644 --- a/src/Storages/ObjectStorage/DataLakes/Iceberg/IcebergWrites.cpp +++ b/src/Storages/ObjectStorage/DataLakes/Iceberg/IcebergWrites.cpp @@ -632,7 +632,7 @@ IcebergStorageSink::IcebergStorageSink( , table_id(table_id_) , persistent_table_components(persistent_table_components_) , data_lake_settings(configuration_->getDataLakeSettings()) - , write_format(configuration_->format) + , write_format(configuration_->getFormat()) , blob_storage_type_name(configuration_->getTypeName()) , blob_storage_namespace_name(configuration_->getNamespace()) { diff --git a/src/Storages/ObjectStorage/HDFS/Configuration.cpp 
b/src/Storages/ObjectStorage/HDFS/Configuration.cpp index 0273860e22f9..e19cf1f86523 100644 --- a/src/Storages/ObjectStorage/HDFS/Configuration.cpp +++ b/src/Storages/ObjectStorage/HDFS/Configuration.cpp @@ -235,6 +235,14 @@ void StorageHDFSConfiguration::addStructureAndFormatToArgsIfNeeded( { addStructureAndFormatToArgsIfNeededHDFS(args, structure_, format_, context, with_structure); } + +ASTPtr StorageHDFSConfiguration::createArgsWithAccessData() const +{ + auto arguments = make_intrusive(); + arguments->children.push_back(make_intrusive(url + path.path)); + return arguments; +} + } #endif diff --git a/src/Storages/ObjectStorage/HDFS/Configuration.h b/src/Storages/ObjectStorage/HDFS/Configuration.h index 8730c5ad08a3..c55c4d0c3eab 100644 --- a/src/Storages/ObjectStorage/HDFS/Configuration.h +++ b/src/Storages/ObjectStorage/HDFS/Configuration.h @@ -80,6 +80,8 @@ class StorageHDFSConfiguration : public StorageObjectStorageConfiguration void addStructureAndFormatToArgsIfNeeded( ASTs & args, const String & structure_, const String & format_, ContextPtr context, bool with_structure) override; + ASTPtr createArgsWithAccessData() const override; + private: void initializeFromParsedArguments(const HDFSStorageParsedArguments & parsed_arguments); void setURL(const std::string & url_); diff --git a/src/Storages/ObjectStorage/ReadBufferIterator.cpp b/src/Storages/ObjectStorage/ReadBufferIterator.cpp index 85c70b06a34a..1f11596b8f6a 100644 --- a/src/Storages/ObjectStorage/ReadBufferIterator.cpp +++ b/src/Storages/ObjectStorage/ReadBufferIterator.cpp @@ -39,8 +39,8 @@ ReadBufferIterator::ReadBufferIterator( , read_keys(read_keys_) , prev_read_keys_size(read_keys_.size()) { - if (configuration->format != "auto") - format = configuration->format; + if (configuration->getFormat() != "auto") + format = configuration->getFormat(); } SchemaCache::Key ReadBufferIterator::getKeyForSchemaCache(const ObjectInfo & object_info, const String & format_name) const @@ -143,7 +143,7 @@ std::unique_ptr ReadBufferIterator::recreateLastReadBuffer() auto impl = createReadBuffer(current_object_info->relative_path_with_metadata, object_storage, context, getLogger("ReadBufferIterator")); - const auto compression_method = chooseCompressionMethod(current_object_info->getFileName(), configuration->compression_method); + const auto compression_method = chooseCompressionMethod(current_object_info->getFileName(), configuration->getCompressionMethod()); const auto zstd_window = static_cast(context->getSettingsRef()[Setting::zstd_window_log_max]); return wrapReadBufferWithCompressionMethod(std::move(impl), compression_method, zstd_window); @@ -259,13 +259,13 @@ ReadBufferIterator::Data ReadBufferIterator::next() using ObjectInfoInArchive = StorageObjectStorageSource::ArchiveIterator::ObjectInfoInArchive; if (const auto * object_info_in_archive = dynamic_cast(current_object_info.get())) { - compression_method = chooseCompressionMethod(filename, configuration->compression_method); + compression_method = chooseCompressionMethod(filename, configuration->getCompressionMethod()); const auto & archive_reader = object_info_in_archive->archive_reader; read_buf = archive_reader->readFile(object_info_in_archive->path_in_archive, /*throw_on_not_found=*/true); } else { - compression_method = chooseCompressionMethod(filename, configuration->compression_method); + compression_method = chooseCompressionMethod(filename, configuration->getCompressionMethod()); read_buf = createReadBuffer( current_object_info->relative_path_with_metadata, 
object_storage, getContext(), getLogger("ReadBufferIterator")); } diff --git a/src/Storages/ObjectStorage/S3/Configuration.cpp b/src/Storages/ObjectStorage/S3/Configuration.cpp index 15627f2845d1..2b7361d5ed48 100644 --- a/src/Storages/ObjectStorage/S3/Configuration.cpp +++ b/src/Storages/ObjectStorage/S3/Configuration.cpp @@ -103,6 +103,7 @@ static const std::unordered_set optional_configuration_keys = "partition_strategy", "partition_columns_in_data_file", "storage_class_name", + "storage_type", /// Private configuration options "role_arn", /// for extra_credentials "role_session_name", /// for extra_credentials @@ -620,6 +621,7 @@ void S3StorageParsedArguments::fromAST(ASTs & args, ContextPtr context, bool wit compression_method = compression_method_value.value(); } + if (auto partition_strategy_value = getFromPositionOrKeyValue("partition_strategy", args, engine_args_to_idx, key_value_args); partition_strategy_value.has_value()) { @@ -1008,6 +1010,31 @@ void StorageS3Configuration::addStructureAndFormatToArgsIfNeeded( addStructureAndFormatToArgsIfNeededS3( args, structure_, format_, context, with_structure, S3StorageParsedArguments::getMaxNumberOfArguments(with_structure)); } + +ASTPtr StorageS3Configuration::createArgsWithAccessData() const +{ + auto arguments = make_intrusive(); + + arguments->children.push_back(make_intrusive(url.uri_str)); + if (s3_settings->auth_settings[S3AuthSetting::no_sign_request]) + { + arguments->children.push_back(make_intrusive("NOSIGN")); + } + else + { + arguments->children.push_back(make_intrusive(s3_settings->auth_settings[S3AuthSetting::access_key_id].value)); + arguments->children.push_back(make_intrusive(s3_settings->auth_settings[S3AuthSetting::secret_access_key].value)); + if (!s3_settings->auth_settings[S3AuthSetting::session_token].value.empty()) + arguments->children.push_back(make_intrusive(s3_settings->auth_settings[S3AuthSetting::session_token].value)); + if (getFormat() != "auto") + arguments->children.push_back(make_intrusive(getFormat())); + if (!getCompressionMethod().empty()) + arguments->children.push_back(make_intrusive(getCompressionMethod())); + } + + return arguments; +} + } #endif diff --git a/src/Storages/ObjectStorage/S3/Configuration.h b/src/Storages/ObjectStorage/S3/Configuration.h index ffd99ea7ec1f..2e238167516a 100644 --- a/src/Storages/ObjectStorage/S3/Configuration.h +++ b/src/Storages/ObjectStorage/S3/Configuration.h @@ -133,6 +133,8 @@ class StorageS3Configuration : public StorageObjectStorageConfiguration ContextPtr context, bool with_structure) override; + ASTPtr createArgsWithAccessData() const override; + static bool collectCredentials(ASTPtr maybe_credentials, S3::S3AuthSettings & auth_settings_, ContextPtr local_context); S3::URI url; diff --git a/src/Storages/ObjectStorage/StorageObjectStorage.cpp b/src/Storages/ObjectStorage/StorageObjectStorage.cpp index 39aab0f30e06..18d2d6824411 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorage.cpp +++ b/src/Storages/ObjectStorage/StorageObjectStorage.cpp @@ -65,6 +65,11 @@ String StorageObjectStorage::getPathSample(ContextPtr context) if (context->getSettingsRef()[Setting::use_hive_partitioning]) local_distributed_processing = false; + const auto path = configuration->getRawPath(); + + if (!configuration->isArchive() && !path.hasGlobs() && !local_distributed_processing) + return path.path; + auto file_iterator = StorageObjectStorageSource::createFileIterator( configuration, query_settings, @@ -80,11 +85,6 @@ String StorageObjectStorage::getPathSample(ContextPtr 
context) {} // file_progress_callback ); - const auto path = configuration->getRawPath(); - - if (!configuration->isArchive() && !path.hasGlobs() && !local_distributed_processing) - return path.path; - if (auto file = file_iterator->next(0)) return file->getPath(); return ""; @@ -101,11 +101,11 @@ StorageObjectStorage::StorageObjectStorage( std::optional format_settings_, LoadingStrictnessLevel mode, std::shared_ptr catalog_, - bool if_not_exists_, + bool /*if_not_exists_*/, bool is_datalake_query, bool distributed_processing_, ASTPtr partition_by_, - ASTPtr order_by_, + ASTPtr /*order_by_*/, bool is_table_function, bool lazy_init) : IStorage(table_id_) @@ -119,9 +119,9 @@ StorageObjectStorage::StorageObjectStorage( { configuration->initPartitionStrategy(partition_by_, columns_in_table_or_function_definition, context); - const bool need_resolve_columns_or_format = columns_in_table_or_function_definition.empty() || (configuration->format == "auto"); + const bool need_resolve_columns_or_format = columns_in_table_or_function_definition.empty() || (configuration->getFormat() == "auto"); const bool need_resolve_sample_path = context->getSettingsRef()[Setting::use_hive_partitioning] - && !configuration->partition_strategy + && !configuration->getPartitionStrategy() && !configuration->isDataLakeConfiguration(); const bool do_lazy_init = lazy_init && !need_resolve_columns_or_format && !need_resolve_sample_path; @@ -139,13 +139,6 @@ StorageObjectStorage::StorageObjectStorage( throw Exception(ErrorCodes::BAD_ARGUMENTS, "Delta lake CDF is allowed only for deltaLake table function"); } - if (!is_table_function && !columns_in_table_or_function_definition.empty() && !is_datalake_query && mode == LoadingStrictnessLevel::CREATE) - { - LOG_DEBUG(log, "Creating new storage with specified columns"); - configuration->create( - object_storage, context, columns_in_table_or_function_definition, partition_by_, order_by_, if_not_exists_, catalog, storage_id); - } - bool updated_configuration = false; try { @@ -179,7 +172,7 @@ StorageObjectStorage::StorageObjectStorage( ColumnsDescription columns{columns_in_table_or_function_definition}; if (need_resolve_columns_or_format) - resolveSchemaAndFormat(columns, configuration->format, object_storage, configuration, format_settings, sample_path, context); + resolveSchemaAndFormat(columns, object_storage, configuration, format_settings, sample_path, context); else validateSupportedColumns(columns, *configuration); @@ -187,7 +180,7 @@ StorageObjectStorage::StorageObjectStorage( /// FIXME: We need to call getPathSample() lazily on select /// in case it failed to be initialized in constructor. 
- if (updated_configuration && sample_path.empty() && need_resolve_sample_path && !configuration->partition_strategy) + if (updated_configuration && sample_path.empty() && need_resolve_sample_path && !configuration->getPartitionStrategy()) { try { @@ -219,7 +212,7 @@ StorageObjectStorage::StorageObjectStorage( sample_path); } - bool format_supports_prewhere = FormatFactory::instance().checkIfFormatSupportsPrewhere(configuration->format, context, format_settings); + bool format_supports_prewhere = FormatFactory::instance().checkIfFormatSupportsPrewhere(configuration->getFormat(), context, format_settings); /// TODO: Known problems with datalake prewhere: /// * If the iceberg table went through schema evolution, columns read from file may need to @@ -251,16 +244,16 @@ StorageObjectStorage::StorageObjectStorage( metadata.setComment(comment); /// I am not sure this is actually required, but just in case - if (configuration->partition_strategy) + if (configuration->getPartitionStrategy()) { - metadata.partition_key = configuration->partition_strategy->getPartitionKeyDescription(); + metadata.partition_key = configuration->getPartitionStrategy()->getPartitionKeyDescription(); } setVirtuals(VirtualColumnUtils::getVirtualsForFileLikeStorage( metadata.columns, context, format_settings, - configuration->partition_strategy_type, + configuration->getPartitionStrategyType(), sample_path)); setInMemoryMetadata(metadata); @@ -282,17 +275,17 @@ String StorageObjectStorage::getName() const bool StorageObjectStorage::prefersLargeBlocks() const { - return FormatFactory::instance().checkIfOutputFormatPrefersLargeBlocks(configuration->format); + return FormatFactory::instance().checkIfOutputFormatPrefersLargeBlocks(configuration->getFormat()); } bool StorageObjectStorage::parallelizeOutputAfterReading(ContextPtr context) const { - return FormatFactory::instance().checkParallelizeOutputAfterReading(configuration->format, context); + return FormatFactory::instance().checkParallelizeOutputAfterReading(configuration->getFormat(), context); } bool StorageObjectStorage::supportsSubsetOfColumns(const ContextPtr & context) const { - return FormatFactory::instance().checkIfFormatSupportsSubsetOfColumns(configuration->format, context, format_settings); + return FormatFactory::instance().checkIfFormatSupportsSubsetOfColumns(configuration->getFormat(), context, format_settings); } bool StorageObjectStorage::supportsPrewhere() const @@ -380,7 +373,7 @@ void StorageObjectStorage::read( /* if_not_updated_before */ false); } - if (configuration->partition_strategy && configuration->partition_strategy_type != PartitionStrategyFactory::StrategyType::HIVE) + if (configuration->getPartitionStrategy() && configuration->getPartitionStrategyType() != PartitionStrategyFactory::StrategyType::HIVE) { throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Reading from a partitioned {} storage is not implemented yet", @@ -512,7 +505,7 @@ SinkToStoragePtr StorageObjectStorage::write( /// Not a data lake, just raw object storage - if (configuration->partition_strategy) + if (configuration->getPartitionStrategy()) { return std::make_shared(object_storage, configuration, format_settings, sample_block, local_context); } @@ -530,8 +523,8 @@ SinkToStoragePtr StorageObjectStorage::write( format_settings, sample_block, local_context, - configuration->format, - configuration->compression_method); + configuration->getFormat(), + configuration->getCompressionMethod()); } bool StorageObjectStorage::optimize( @@ -629,7 +622,7 @@ ColumnsDescription 
StorageObjectStorage::resolveSchemaFromData( { ObjectInfos read_keys; auto iterator = createReadBufferIterator(object_storage, configuration, format_settings, read_keys, context); - auto schema = readSchemaFromFormat(configuration->format, format_settings, *iterator, context); + auto schema = readSchemaFromFormat(configuration->getFormat(), format_settings, *iterator, context); sample_path = iterator->getLastFilePath(); return schema; } @@ -650,7 +643,7 @@ std::string StorageObjectStorage::resolveFormatFromData( std::pair StorageObjectStorage::resolveSchemaAndFormatFromData( const ObjectStoragePtr & object_storage, - const StorageObjectStorageConfigurationPtr & configuration, + StorageObjectStorageConfigurationPtr & configuration, const std::optional & format_settings, std::string & sample_path, const ContextPtr & context) @@ -659,13 +652,13 @@ std::pair StorageObjectStorage::resolveSchemaAn auto iterator = createReadBufferIterator(object_storage, configuration, format_settings, read_keys, context); auto [columns, format] = detectFormatAndReadSchema(format_settings, *iterator, context); sample_path = iterator->getLastFilePath(); - configuration->format = format; + configuration->setFormat(format); return std::pair(columns, format); } void StorageObjectStorage::addInferredEngineArgsToCreateQuery(ASTs & args, const ContextPtr & context) const { - configuration->addStructureAndFormatToArgsIfNeeded(args, "", configuration->format, context, /*with_structure=*/false); + configuration->addStructureAndFormatToArgsIfNeeded(args, "", configuration->getFormat(), context, /*with_structure=*/false); } SchemaCache & StorageObjectStorage::getSchemaCache(const ContextPtr & context, const std::string & storage_engine_name) diff --git a/src/Storages/ObjectStorage/StorageObjectStorage.h b/src/Storages/ObjectStorage/StorageObjectStorage.h index e65f6e3495d0..74e3c6c981fa 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorage.h +++ b/src/Storages/ObjectStorage/StorageObjectStorage.h @@ -125,7 +125,7 @@ class StorageObjectStorage : public IStorage static std::pair resolveSchemaAndFormatFromData( const ObjectStoragePtr & object_storage, - const StorageObjectStorageConfigurationPtr & configuration, + StorageObjectStorageConfigurationPtr & configuration, const std::optional & format_settings, std::string & sample_path, const ContextPtr & context); diff --git a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp index 4611aa7cb271..329dd39f56e9 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp +++ b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp @@ -8,9 +8,16 @@ #include #include +#include +#include +#include +#include +#include #include #include #include +#include +#include #include #include @@ -26,6 +33,8 @@ namespace Setting extern const SettingsBool use_hive_partitioning; extern const SettingsBool cluster_function_process_archive_on_multiple_nodes; extern const SettingsObjectStorageGranularityLevel cluster_table_function_split_granularity; + extern const SettingsBool parallel_replicas_for_cluster_engines; + extern const SettingsString object_storage_cluster; } namespace ErrorCodes @@ -38,6 +47,14 @@ String StorageObjectStorageCluster::getPathSample(ContextPtr context) auto query_settings = configuration->getQuerySettings(context); /// We don't want to throw an exception if there are no files with specified path. 
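/// (Editor's note.) The lines added below also short-circuit sampling: for a non-archive
/// source whose read path contains no globs, the path itself is returned as the sample,
/// so no object storage listing is needed.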
query_settings.throw_on_zero_files_match = false; + + if (!configuration->isArchive()) + { + const auto & path = configuration->getPathForRead(); + if (!path.hasGlobs()) + return path.path; + } + auto file_iterator = StorageObjectStorageSource::createFileIterator( configuration, query_settings, @@ -50,11 +67,14 @@ String StorageObjectStorageCluster::getPathSample(ContextPtr context) {}, // virtual_columns {}, // hive_columns nullptr, // read_keys - {} // file_progress_callback + {}, // file_progress_callback + false, // ignore_archive_globs + true // skip_object_metadata ); if (auto file = file_iterator->next(0)) return file->getPath(); + return ""; } @@ -66,21 +86,52 @@ StorageObjectStorageCluster::StorageObjectStorageCluster( const ColumnsDescription & columns_in_table_or_function_definition, const ConstraintsDescription & constraints_, const ASTPtr & partition_by, + const ASTPtr & order_by, ContextPtr context_, - bool is_table_function) + const String & comment_, + std::optional format_settings_, + LoadingStrictnessLevel mode_, + std::shared_ptr catalog, + bool if_not_exists, + bool is_datalake_query, + bool is_table_function, + bool lazy_init) : IStorageCluster( cluster_name_, table_id_, getLogger(fmt::format("{}({})", configuration_->getEngineName(), table_id_.table_name))) , configuration{configuration_} , object_storage(object_storage_) + , cluster_name_in_settings(false) { configuration->initPartitionStrategy(partition_by, columns_in_table_or_function_definition, context_); - /// We allow exceptions to be thrown on update(), - /// because Cluster engine can only be used as table function, - /// so no lazy initialization is allowed. - configuration->update( - object_storage, - context_, - /* if_not_updated_before */ false); + + const bool need_resolve_columns_or_format = columns_in_table_or_function_definition.empty() || (configuration->getFormat() == "auto"); + const bool do_lazy_init = lazy_init && !need_resolve_columns_or_format; + + auto log_ = getLogger("StorageObjectStorageCluster"); + + try + { + if (!do_lazy_init) + { + /// We allow exceptions to be thrown on update(), + /// because Cluster engine can only be used as table function, + /// so no lazy initialization is allowed. + configuration->update( + object_storage, + context_, + /* if_not_updated_before */false); + } + } + catch (...) 
+ { + // If we don't have format or schema yet, we can't ignore failed configuration update, + // because relevant configuration is crucial for format and schema inference + if (mode_ <= LoadingStrictnessLevel::CREATE || need_resolve_columns_or_format) + { + throw; + } + tryLogCurrentException(log_); + } // For tables need to update configuration on each read // because data can be changed after previous update @@ -88,13 +139,16 @@ StorageObjectStorageCluster::StorageObjectStorageCluster( ColumnsDescription columns{columns_in_table_or_function_definition}; std::string sample_path; - resolveSchemaAndFormat(columns, configuration->format, object_storage, configuration, {}, sample_path, context_); + if (need_resolve_columns_or_format) + resolveSchemaAndFormat(columns, object_storage, configuration, {}, sample_path, context_); + else + validateSupportedColumns(columns, *configuration); configuration->check(context_); if (sample_path.empty() && context_->getSettingsRef()[Setting::use_hive_partitioning] && !configuration->isDataLakeConfiguration() - && !configuration->partition_strategy) + && !configuration->getPartitionStrategy()) sample_path = getPathSample(context_); /// Not grabbing the file_columns because it is not necessary to do it here. @@ -114,7 +168,7 @@ StorageObjectStorageCluster::StorageObjectStorageCluster( metadata.columns, context_, /* format_settings */std::nullopt, - configuration->partition_strategy_type, + configuration->getPartitionStrategyType(), sample_path)); setInMemoryMetadata(metadata); @@ -126,6 +180,39 @@ StorageObjectStorageCluster::StorageObjectStorageCluster( auto metadata_snapshot = configuration->getStorageSnapshotMetadata(context_); setInMemoryMetadata(metadata_snapshot); } + + const auto can_use_parallel_replicas = !cluster_name_.empty() + && context_->getSettingsRef()[Setting::parallel_replicas_for_cluster_engines] + && context_->canUseTaskBasedParallelReplicas() + && !context_->isDistributed(); + + bool can_use_distributed_iterator = + context_->getClientInfo().collaborate_with_initiator && + can_use_parallel_replicas; + + pure_storage = std::make_shared( + configuration, + object_storage, + context_, + getStorageID(), + IStorageCluster::getInMemoryMetadata().getColumns(), + IStorageCluster::getInMemoryMetadata().getConstraints(), + comment_, + format_settings_, + mode_, + catalog, + if_not_exists, + is_datalake_query, + /* distributed_processing */can_use_distributed_iterator, + partition_by, + order_by, + /* is_table_function */false, + /* lazy_init */lazy_init); + + auto virtuals_ = getVirtualsPtr(); + if (virtuals_) + pure_storage->setVirtuals(*virtuals_); + pure_storage->setInMemoryMetadata(IStorageCluster::getInMemoryMetadata()); } std::string StorageObjectStorageCluster::getName() const @@ -135,6 +222,8 @@ std::string StorageObjectStorageCluster::getName() const std::optional StorageObjectStorageCluster::totalRows(ContextPtr query_context) const { + if (pure_storage) + return pure_storage->totalRows(query_context); configuration->update( object_storage, query_context, @@ -144,6 +233,8 @@ std::optional StorageObjectStorageCluster::totalRows(ContextPtr query_co std::optional StorageObjectStorageCluster::totalBytes(ContextPtr query_context) const { + if (pure_storage) + return pure_storage->totalBytes(query_context); configuration->update( object_storage, query_context, @@ -151,11 +242,135 @@ std::optional StorageObjectStorageCluster::totalBytes(ContextPtr query_c return configuration->totalBytes(query_context); } +void 
StorageObjectStorageCluster::updateQueryForDistributedEngineIfNeeded(ASTPtr & query, ContextPtr context) +{ + // Change table engine on table function for distributed request + // CREATE TABLE t (...) ENGINE=IcebergS3(...) + // SELECT * FROM t + // change on + // SELECT * FROM icebergS3(...) + // to execute on cluster nodes + + auto * select_query = query->as(); + if (!select_query || !select_query->tables()) + return; + + auto * tables = select_query->tables()->as(); + + if (tables->children.empty()) + throw Exception( + ErrorCodes::LOGICAL_ERROR, + "Expected SELECT query from table with engine {}, got '{}'", + configuration->getEngineName(), query->formatForLogging()); + + auto * table_expression = tables->children[0]->as()->table_expression->as(); + + if (!table_expression) + return; + + if (!table_expression->database_and_table_name) + return; + + auto & table_identifier_typed = table_expression->database_and_table_name->as(); + + auto table_alias = table_identifier_typed.tryGetAlias(); + + auto storage_engine_name = configuration->getEngineName(); + if (storage_engine_name == "Iceberg") + { + switch (configuration->getType()) + { + case ObjectStorageType::S3: + storage_engine_name = "IcebergS3"; + break; + case ObjectStorageType::Azure: + storage_engine_name = "IcebergAzure"; + break; + case ObjectStorageType::HDFS: + storage_engine_name = "IcebergHDFS"; + break; + default: + throw Exception( + ErrorCodes::LOGICAL_ERROR, + "Can't find table function for engine {}", + storage_engine_name + ); + } + } + + static std::unordered_map engine_to_function = { + {"S3", "s3"}, + {"Azure", "azureBlobStorage"}, + {"HDFS", "hdfs"}, + {"Iceberg", "iceberg"}, + {"IcebergS3", "icebergS3"}, + {"IcebergAzure", "icebergAzure"}, + {"IcebergHDFS", "icebergHDFS"}, + {"DeltaLake", "deltaLake"}, + {"DeltaLakeS3", "deltaLakeS3"}, + {"DeltaLakeAzure", "deltaLakeAzure"}, + {"Hudi", "hudi"} + }; + + auto p = engine_to_function.find(storage_engine_name); + if (p == engine_to_function.end()) + { + throw Exception( + ErrorCodes::LOGICAL_ERROR, + "Can't find table function for engine {}", + storage_engine_name + ); + } + + std::string table_function_name = p->second; + + auto function_ast = make_intrusive(); + function_ast->name = table_function_name; + + auto cluster_name = getClusterName(context); + + if (cluster_name.empty()) + { + throw Exception( + ErrorCodes::LOGICAL_ERROR, + "Can't be here without cluster name, no cluster name in query {}", + query->formatForLogging()); + } + + function_ast->arguments = configuration->createArgsWithAccessData(); + function_ast->children.push_back(function_ast->arguments); + function_ast->setAlias(table_alias); + + ASTPtr function_ast_ptr(function_ast); + + table_expression->database_and_table_name = nullptr; + table_expression->table_function = function_ast_ptr; + table_expression->children[0] = function_ast_ptr; + + auto settings = select_query->settings(); + if (settings) + { + auto & settings_ast = settings->as(); + settings_ast.changes.insertSetting("object_storage_cluster", cluster_name); + } + else + { + auto settings_ast_ptr = make_intrusive(); + settings_ast_ptr->is_standalone = false; + settings_ast_ptr->changes.setSetting("object_storage_cluster", cluster_name); + select_query->setExpression(ASTSelectQuery::Expression::SETTINGS, std::move(settings_ast_ptr)); + } + + cluster_name_in_settings = true; +} + void StorageObjectStorageCluster::updateQueryToSendIfNeeded( ASTPtr & query, const DB::StorageSnapshotPtr & storage_snapshot, const ContextPtr & context) { + 
updateQueryForDistributedEngineIfNeeded(query, context); + auto * table_function = extractTableFunctionFromSelectQuery(query); if (!table_function) return; @@ -178,6 +393,8 @@ void StorageObjectStorageCluster::updateQueryToSendIfNeeded( configuration->getEngineName()); } + ASTPtr object_storage_type_arg; + configuration->extractDynamicStorageType(args, context, &object_storage_type_arg); ASTPtr settings_temporary_storage = nullptr; for (auto it = args.begin(); it != args.end(); ++it) { @@ -190,23 +407,79 @@ void StorageObjectStorageCluster::updateQueryToSendIfNeeded( } } - if (!endsWith(table_function->name, "Cluster")) - configuration->addStructureAndFormatToArgsIfNeeded(args, structure, configuration->format, context, /*with_structure=*/true); + if (cluster_name_in_settings || !endsWith(table_function->name, "Cluster")) + { + configuration->addStructureAndFormatToArgsIfNeeded(args, structure, configuration->getFormat(), context, /*with_structure=*/true); + + /// Convert to old-stype *Cluster table function. + /// This allows to use old clickhouse versions in cluster. + static std::unordered_map function_to_cluster_function = { + {"s3", "s3Cluster"}, + {"azureBlobStorage", "azureBlobStorageCluster"}, + {"hdfs", "hdfsCluster"}, + {"iceberg", "icebergCluster"}, + {"icebergS3", "icebergS3Cluster"}, + {"icebergAzure", "icebergAzureCluster"}, + {"icebergHDFS", "icebergHDFSCluster"}, + {"deltaLake", "deltaLakeCluster"}, + {"deltaLakeS3", "deltaLakeS3Cluster"}, + {"deltaLakeAzure", "deltaLakeAzureCluster"}, + {"hudi", "hudiCluster"}, + }; + + auto p = function_to_cluster_function.find(table_function->name); + if (p == function_to_cluster_function.end()) + { + throw Exception( + ErrorCodes::LOGICAL_ERROR, + "Can't find cluster name for table function {}", + table_function->name); + } + + table_function->name = p->second; + + auto cluster_name = getClusterName(context); + auto cluster_name_arg = make_intrusive(cluster_name); + args.insert(args.begin(), cluster_name_arg); + + auto * select_query = query->as(); + if (!select_query) + throw Exception( + ErrorCodes::LOGICAL_ERROR, + "Expected SELECT query from table function {}", + configuration->getEngineName()); + + auto settings = select_query->settings(); + if (settings) + { + auto & settings_ast = settings->as(); + if (settings_ast.changes.removeSetting("object_storage_cluster") && settings_ast.changes.empty()) + { + select_query->setExpression(ASTSelectQuery::Expression::SETTINGS, {}); + } + /// No throw if not found - `object_storage_cluster` can be global setting. 
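/// (Editor's note, illustrative.) This branch rewrites the query that will be sent to the
/// other hosts from the new syntax into the old-style *Cluster table function, so that
/// older ClickHouse versions in the cluster can still execute it. Roughly:
///   SELECT * FROM icebergS3('<url>', ...) SETTINGS object_storage_cluster = 'my_cluster'
/// becomes
///   SELECT * FROM icebergS3Cluster('my_cluster', '<url>', ..., '<format>', '<structure>')
/// with the per-query `object_storage_cluster` setting dropped once it has been folded into
/// the first argument (the SETTINGS clause itself is removed only when nothing else is left).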
+ } + } else { ASTPtr cluster_name_arg = args.front(); args.erase(args.begin()); - configuration->addStructureAndFormatToArgsIfNeeded(args, structure, configuration->format, context, /*with_structure=*/true); + configuration->addStructureAndFormatToArgsIfNeeded(args, structure, configuration->getFormat(), context, /*with_structure=*/true); args.insert(args.begin(), cluster_name_arg); } if (settings_temporary_storage) { args.insert(args.end(), std::move(settings_temporary_storage)); } + if (object_storage_type_arg) + args.insert(args.end(), object_storage_type_arg); } void StorageObjectStorageCluster::updateExternalDynamicMetadataIfExists(ContextPtr query_context) { + if (getClusterName(query_context).empty()) + return pure_storage->updateExternalDynamicMetadataIfExists(query_context); + configuration->update( object_storage, query_context, @@ -245,7 +518,7 @@ RemoteQueryExecutor::Extension StorageObjectStorageCluster::getTaskIteratorExten { iterator = std::make_shared( std::move(iterator), - configuration->format, + configuration->getFormat(), object_storage, local_context ); @@ -292,4 +565,318 @@ void StorageObjectStorageCluster::updateConfigurationIfNeeded(ContextPtr context } } +void StorageObjectStorageCluster::readFallBackToPure( + QueryPlan & query_plan, + const Names & column_names, + const StorageSnapshotPtr & storage_snapshot, + SelectQueryInfo & query_info, + ContextPtr context, + QueryProcessingStage::Enum processed_stage, + size_t max_block_size, + size_t num_streams) +{ + pure_storage->read(query_plan, column_names, storage_snapshot, query_info, context, processed_stage, max_block_size, num_streams); +} + +SinkToStoragePtr StorageObjectStorageCluster::writeFallBackToPure( + const ASTPtr & query, + const StorageMetadataPtr & metadata_snapshot, + ContextPtr context, + bool async_insert) +{ + return pure_storage->write(query, metadata_snapshot, context, async_insert); +} + +String StorageObjectStorageCluster::getClusterName(ContextPtr context) const +{ + /// StorageObjectStorageCluster is always created for cluster or non-cluster variants. + /// User can specify cluster name in table definition or in setting `object_storage_cluster` + /// only for several queries. When it specified in both places, priority is given to the query setting. + /// When it is empty, non-cluster realization is used. + auto cluster_name_from_settings = context->getSettingsRef()[Setting::object_storage_cluster].value; + if (cluster_name_from_settings.empty()) + cluster_name_from_settings = getOriginalClusterName(); + return cluster_name_from_settings; +} + +QueryProcessingStage::Enum StorageObjectStorageCluster::getQueryProcessingStage( + ContextPtr context, QueryProcessingStage::Enum to_stage, const StorageSnapshotPtr & storage_snapshot, SelectQueryInfo & query_info) const +{ + /// Full query if fall back to pure storage. + if (getClusterName(context).empty()) + return QueryProcessingStage::Enum::FetchColumns; + + /// Distributed storage. 
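/// (Editor's note, illustrative.) Whether the distributed or the pure path is taken is
/// decided per query via getClusterName() above; a table created without a cluster can
/// still be fanned out by the query-level setting, e.g.
///   CREATE TABLE t ENGINE = S3('https://bucket.s3.amazonaws.com/data/*.parquet', 'Parquet');
///   SELECT count() FROM t;                                                -- pure storage, local
///   SELECT count() FROM t SETTINGS object_storage_cluster = 'my_cluster'; -- distributed
/// A cluster named in the table definition is used by default; a non-empty query-level
/// setting takes priority over it.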
+ return IStorageCluster::getQueryProcessingStage(context, to_stage, storage_snapshot, query_info); +} + +std::optional StorageObjectStorageCluster::distributedWrite( + const ASTInsertQuery & query, + ContextPtr context) +{ + if (getClusterName(context).empty()) + return pure_storage->distributedWrite(query, context); + return IStorageCluster::distributedWrite(query, context); +} + +void StorageObjectStorageCluster::drop() +{ + if (pure_storage) + { + pure_storage->drop(); + return; + } + IStorageCluster::drop(); +} + +void StorageObjectStorageCluster::dropInnerTableIfAny(bool sync, ContextPtr context) +{ + if (getClusterName(context).empty()) + { + pure_storage->dropInnerTableIfAny(sync, context); + return; + } + IStorageCluster::dropInnerTableIfAny(sync, context); +} + +void StorageObjectStorageCluster::truncate( + const ASTPtr & query, + const StorageMetadataPtr & metadata_snapshot, + ContextPtr local_context, + TableExclusiveLockHolder & lock_holder) +{ + /// Full query if fall back to pure storage. + if (getClusterName(local_context).empty()) + { + pure_storage->truncate(query, metadata_snapshot, local_context, lock_holder); + return; + } + + throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Truncate is not supported by storage {}", getName()); +} + +void StorageObjectStorageCluster::checkTableCanBeRenamed(const StorageID & new_name) const +{ + if (pure_storage) + { + pure_storage->checkTableCanBeRenamed(new_name); + return; + } + IStorageCluster::checkTableCanBeRenamed(new_name); +} + +void StorageObjectStorageCluster::rename(const String & new_path_to_table_data, const StorageID & new_table_id) +{ + if (pure_storage) + { + pure_storage->rename(new_path_to_table_data, new_table_id); + return; + } + IStorageCluster::rename(new_path_to_table_data, new_table_id); +} + +void StorageObjectStorageCluster::renameInMemory(const StorageID & new_table_id) +{ + if (pure_storage) + { + pure_storage->renameInMemory(new_table_id); + return; + } + IStorageCluster::renameInMemory(new_table_id); +} + +void StorageObjectStorageCluster::alter(const AlterCommands & params, ContextPtr context, AlterLockHolder & alter_lock_holder) +{ + if (getClusterName(context).empty()) + { + pure_storage->alter(params, context, alter_lock_holder); + setInMemoryMetadata(pure_storage->getInMemoryMetadata()); + return; + } + IStorageCluster::alter(params, context, alter_lock_holder); + pure_storage->setInMemoryMetadata(IStorageCluster::getInMemoryMetadata()); +} + +void StorageObjectStorageCluster::addInferredEngineArgsToCreateQuery(ASTs & args, const ContextPtr & context) const +{ + configuration->addStructureAndFormatToArgsIfNeeded(args, "", configuration->getFormat(), context, /*with_structure=*/false); +} + +StorageMetadataPtr StorageObjectStorageCluster::getInMemoryMetadataPtr(bool bypass_metadata_cache) const +{ + if (pure_storage) + return pure_storage->getInMemoryMetadataPtr(bypass_metadata_cache); + return IStorageCluster::getInMemoryMetadataPtr(bypass_metadata_cache); +} + +IDataLakeMetadata * StorageObjectStorageCluster::getExternalMetadata(ContextPtr query_context) +{ + if (getClusterName(query_context).empty()) + return pure_storage->getExternalMetadata(query_context); + + configuration->update( + object_storage, + query_context, + /* if_not_updated_before */false); + + return configuration->getExternalMetadata(); +} + +void StorageObjectStorageCluster::checkAlterIsPossible(const AlterCommands & commands, ContextPtr context) const +{ + if (getClusterName(context).empty()) + { + 
pure_storage->checkAlterIsPossible(commands, context); + return; + } + IStorageCluster::checkAlterIsPossible(commands, context); +} + +void StorageObjectStorageCluster::checkMutationIsPossible(const MutationCommands & commands, const Settings & settings) const +{ + if (pure_storage) + { + pure_storage->checkMutationIsPossible(commands, settings); + return; + } + IStorageCluster::checkMutationIsPossible(commands, settings); +} + +Pipe StorageObjectStorageCluster::alterPartition( + const StorageMetadataPtr & metadata_snapshot, + const PartitionCommands & commands, + ContextPtr context) +{ + if (getClusterName(context).empty()) + return pure_storage->alterPartition(metadata_snapshot, commands, context); + return IStorageCluster::alterPartition(metadata_snapshot, commands, context); +} + +void StorageObjectStorageCluster::checkAlterPartitionIsPossible( + const PartitionCommands & commands, + const StorageMetadataPtr & metadata_snapshot, + const Settings & settings, + ContextPtr context) const +{ + if (getClusterName(context).empty()) + { + pure_storage->checkAlterPartitionIsPossible(commands, metadata_snapshot, settings, context); + return; + } + IStorageCluster::checkAlterPartitionIsPossible(commands, metadata_snapshot, settings, context); +} + +bool StorageObjectStorageCluster::optimize( + const ASTPtr & query, + const StorageMetadataPtr & metadata_snapshot, + const ASTPtr & partition, + bool final, + bool deduplicate, + const Names & deduplicate_by_columns, + bool cleanup, + ContextPtr context) +{ + if (getClusterName(context).empty()) + return pure_storage->optimize(query, metadata_snapshot, partition, final, deduplicate, deduplicate_by_columns, cleanup, context); + return IStorageCluster::optimize(query, metadata_snapshot, partition, final, deduplicate, deduplicate_by_columns, cleanup, context); +} + +QueryPipeline StorageObjectStorageCluster::updateLightweight(const MutationCommands & commands, ContextPtr context) +{ + if (getClusterName(context).empty()) + return pure_storage->updateLightweight(commands, context); + return IStorageCluster::updateLightweight(commands, context); +} + +void StorageObjectStorageCluster::mutate(const MutationCommands & commands, ContextPtr context) +{ + if (getClusterName(context).empty()) + { + pure_storage->mutate(commands, context); + return; + } + IStorageCluster::mutate(commands, context); +} + +CancellationCode StorageObjectStorageCluster::killMutation(const String & mutation_id) +{ + if (pure_storage) + return pure_storage->killMutation(mutation_id); + return IStorageCluster::killMutation(mutation_id); +} + +void StorageObjectStorageCluster::waitForMutation(const String & mutation_id, bool wait_for_another_mutation) +{ + if (pure_storage) + { + pure_storage->waitForMutation(mutation_id, wait_for_another_mutation); + return; + } + IStorageCluster::waitForMutation(mutation_id, wait_for_another_mutation); +} + +void StorageObjectStorageCluster::setMutationCSN(const String & mutation_id, UInt64 csn) +{ + if (pure_storage) + { + pure_storage->setMutationCSN(mutation_id, csn); + return; + } + IStorageCluster::setMutationCSN(mutation_id, csn); +} + +CancellationCode StorageObjectStorageCluster::killPartMoveToShard(const UUID & task_uuid) +{ + if (pure_storage) + return pure_storage->killPartMoveToShard(task_uuid); + return IStorageCluster::killPartMoveToShard(task_uuid); +} + +void StorageObjectStorageCluster::startup() +{ + if (pure_storage) + { + pure_storage->startup(); + return; + } + IStorageCluster::startup(); +} + +void 
StorageObjectStorageCluster::shutdown(bool is_drop) +{ + if (pure_storage) + { + pure_storage->shutdown(is_drop); + return; + } + IStorageCluster::shutdown(is_drop); +} + +void StorageObjectStorageCluster::flushAndPrepareForShutdown() +{ + if (pure_storage) + { + pure_storage->flushAndPrepareForShutdown(); + return; + } + IStorageCluster::flushAndPrepareForShutdown(); +} + +ActionLock StorageObjectStorageCluster::getActionLock(StorageActionBlockType action_type) +{ + if (pure_storage) + return pure_storage->getActionLock(action_type); + return IStorageCluster::getActionLock(action_type); +} + +void StorageObjectStorageCluster::onActionLockRemove(StorageActionBlockType action_type) +{ + if (pure_storage) + { + pure_storage->onActionLockRemove(action_type); + return; + } + IStorageCluster::onActionLockRemove(action_type); +} + } diff --git a/src/Storages/ObjectStorage/StorageObjectStorageCluster.h b/src/Storages/ObjectStorage/StorageObjectStorageCluster.h index 45509cbf09a3..10ab3af0b69e 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageCluster.h +++ b/src/Storages/ObjectStorage/StorageObjectStorageCluster.h @@ -18,8 +18,16 @@ class StorageObjectStorageCluster : public IStorageCluster const ColumnsDescription & columns_in_table_or_function_definition, const ConstraintsDescription & constraints_, const ASTPtr & partition_by, + const ASTPtr & order_by, ContextPtr context_, - bool is_table_function_ = false); + const String & comment_, + std::optional format_settings_, + LoadingStrictnessLevel mode_, + std::shared_ptr catalog, + bool if_not_exists, + bool is_datalake_query, + bool is_table_function_ = false, + bool lazy_init = false); std::string getName() const override; @@ -34,6 +42,86 @@ class StorageObjectStorageCluster : public IStorageCluster std::optional totalRows(ContextPtr query_context) const override; std::optional totalBytes(ContextPtr query_context) const override; + void setClusterNameInSettings(bool cluster_name_in_settings_) { cluster_name_in_settings = cluster_name_in_settings_; } + + String getClusterName(ContextPtr context) const override; + + QueryProcessingStage::Enum getQueryProcessingStage(ContextPtr, QueryProcessingStage::Enum, const StorageSnapshotPtr &, SelectQueryInfo &) const override; + + std::optional distributedWrite( + const ASTInsertQuery & query, + ContextPtr context) override; + + void drop() override; + + void dropInnerTableIfAny(bool sync, ContextPtr context) override; + + void truncate( + const ASTPtr & query, + const StorageMetadataPtr & metadata_snapshot, + ContextPtr local_context, + TableExclusiveLockHolder &) override; + + void checkTableCanBeRenamed(const StorageID & new_name) const override; + + void rename(const String & new_path_to_table_data, const StorageID & new_table_id) override; + + void renameInMemory(const StorageID & new_table_id) override; + + void alter(const AlterCommands & params, ContextPtr context, AlterLockHolder & alter_lock_holder) override; + + void addInferredEngineArgsToCreateQuery(ASTs & args, const ContextPtr & context) const override; + + IDataLakeMetadata * getExternalMetadata(ContextPtr query_context); + + StorageMetadataPtr getInMemoryMetadataPtr(bool bypass_metadata_cache) const override; + + void checkAlterIsPossible(const AlterCommands & commands, ContextPtr context) const override; + + void checkMutationIsPossible(const MutationCommands & commands, const Settings & settings) const override; + + Pipe alterPartition( + const StorageMetadataPtr & metadata_snapshot, + const PartitionCommands & commands, + 
ContextPtr context) override; + + void checkAlterPartitionIsPossible( + const PartitionCommands & commands, + const StorageMetadataPtr & metadata_snapshot, + const Settings & settings, + ContextPtr context) const override; + + bool optimize( + const ASTPtr & query, + const StorageMetadataPtr & metadata_snapshot, + const ASTPtr & partition, + bool final, + bool deduplicate, + const Names & deduplicate_by_columns, + bool cleanup, + ContextPtr context) override; + + QueryPipeline updateLightweight(const MutationCommands & commands, ContextPtr context) override; + + void mutate(const MutationCommands & commands, ContextPtr context) override; + + CancellationCode killMutation(const String & mutation_id) override; + + void waitForMutation(const String & mutation_id, bool wait_for_another_mutation) override; + + void setMutationCSN(const String & mutation_id, UInt64 csn) override; + + CancellationCode killPartMoveToShard(const UUID & task_uuid) override; + + void startup() override; + + void shutdown(bool is_drop = false) override; + + void flushAndPrepareForShutdown() override; + + ActionLock getActionLock(StorageActionBlockType action_type) override; + + void onActionLockRemove(StorageActionBlockType action_type) override; void updateExternalDynamicMetadataIfExists(ContextPtr query_context) override; @@ -45,12 +133,46 @@ class StorageObjectStorageCluster : public IStorageCluster void updateConfigurationIfNeeded(ContextPtr context) override; + void readFallBackToPure( + QueryPlan & query_plan, + const Names & column_names, + const StorageSnapshotPtr & storage_snapshot, + SelectQueryInfo & query_info, + ContextPtr context, + QueryProcessingStage::Enum processed_stage, + size_t max_block_size, + size_t num_streams) override; + + SinkToStoragePtr writeFallBackToPure( + const ASTPtr & query, + const StorageMetadataPtr & metadata_snapshot, + ContextPtr context, + bool async_insert) override; + + /* + In case the table was created with `object_storage_cluster` setting, + modify the AST query object so that it uses the table function implementation + by mapping the engine name to table function name and setting `object_storage_cluster`. + For table like + CREATE TABLE table ENGINE=S3(...) SETTINGS object_storage_cluster='cluster' + coverts request + SELECT * FROM table + to + SELECT * FROM s3(...) SETTINGS object_storage_cluster='cluster' + to make distributed request over cluster 'cluster'. 
+ */ + void updateQueryForDistributedEngineIfNeeded(ASTPtr & query, ContextPtr context); + const String engine_name; - const StorageObjectStorageConfigurationPtr configuration; + StorageObjectStorageConfigurationPtr configuration; const ObjectStoragePtr object_storage; NamesAndTypesList virtual_columns; NamesAndTypesList hive_partition_columns_to_read_from_file_path; bool update_configuration_on_read_write; + bool cluster_name_in_settings; + + /// non-clustered storage to fall back on pure realisation if needed + std::shared_ptr pure_storage; }; } diff --git a/src/Storages/ObjectStorage/StorageObjectStorageConfiguration.cpp b/src/Storages/ObjectStorage/StorageObjectStorageConfiguration.cpp index a5e3b0e992d9..09f798c7005b 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageConfiguration.cpp +++ b/src/Storages/ObjectStorage/StorageObjectStorageConfiguration.cpp @@ -69,69 +69,68 @@ StorageInMemoryMetadata StorageObjectStorageConfiguration::getStorageSnapshotMet void StorageObjectStorageConfiguration::initialize( - StorageObjectStorageConfiguration & configuration_to_initialize, ASTs & engine_args, ContextPtr local_context, bool with_table_structure) { std::string disk_name; - if (configuration_to_initialize.isDataLakeConfiguration()) + if (isDataLakeConfiguration()) { - const auto & storage_settings = configuration_to_initialize.getDataLakeSettings(); + const auto & storage_settings = getDataLakeSettings(); disk_name = storage_settings[DataLakeStorageSetting::disk].changed ? storage_settings[DataLakeStorageSetting::disk].value : ""; } if (!disk_name.empty()) - configuration_to_initialize.fromDisk(disk_name, engine_args, local_context, with_table_structure); + fromDisk(disk_name, engine_args, local_context, with_table_structure); else if (auto named_collection = tryGetNamedCollectionWithOverrides(engine_args, local_context)) - configuration_to_initialize.fromNamedCollection(*named_collection, local_context); + fromNamedCollection(*named_collection, local_context); else - configuration_to_initialize.fromAST(engine_args, local_context, with_table_structure); + fromAST(engine_args, local_context, with_table_structure); - if (configuration_to_initialize.isNamespaceWithGlobs()) + if (isNamespaceWithGlobs()) throw Exception(ErrorCodes::BAD_ARGUMENTS, - "Expression can not have wildcards inside {} name", configuration_to_initialize.getNamespaceType()); + "Expression can not have wildcards inside {} name", getNamespaceType()); - if (configuration_to_initialize.isDataLakeConfiguration()) + if (isDataLakeConfiguration()) { - if (configuration_to_initialize.partition_strategy_type != PartitionStrategyFactory::StrategyType::NONE) + if (getPartitionStrategyType() != PartitionStrategyFactory::StrategyType::NONE) { throw Exception(ErrorCodes::BAD_ARGUMENTS, "The `partition_strategy` argument is incompatible with data lakes"); } } - else if (configuration_to_initialize.partition_strategy_type == PartitionStrategyFactory::StrategyType::NONE) + else if (getPartitionStrategyType() == PartitionStrategyFactory::StrategyType::NONE) { - if (configuration_to_initialize.getRawPath().hasPartitionWildcard()) + if (getRawPath().hasPartitionWildcard()) { // Promote to wildcard in case it is not data lake to make it backwards compatible - configuration_to_initialize.partition_strategy_type = PartitionStrategyFactory::StrategyType::WILDCARD; + setPartitionStrategyType(PartitionStrategyFactory::StrategyType::WILDCARD); } } - if (configuration_to_initialize.format == "auto") + if (format == "auto") { - if 
(configuration_to_initialize.isDataLakeConfiguration()) + if (isDataLakeConfiguration()) { - configuration_to_initialize.format = "Parquet"; + format = "Parquet"; } else { - configuration_to_initialize.format + format = FormatFactory::instance() - .tryGetFormatFromFileName(configuration_to_initialize.isArchive() ? configuration_to_initialize.getPathInArchive() : configuration_to_initialize.getRawPath().path) + .tryGetFormatFromFileName(isArchive() ? getPathInArchive() : getRawPath().path) .value_or("auto"); } } else - FormatFactory::instance().checkFormatName(configuration_to_initialize.format); + FormatFactory::instance().checkFormatName(format); /// It might be changed on `StorageObjectStorageConfiguration::initPartitionStrategy` /// We shouldn't set path for disk setup because path prefix is already set in used object_storage. if (disk_name.empty()) - configuration_to_initialize.read_path = configuration_to_initialize.getRawPath(); + read_path = getRawPath(); - configuration_to_initialize.initialized = true; + initialized = true; } void StorageObjectStorageConfiguration::initPartitionStrategy(ASTPtr partition_by, const ColumnsDescription & columns, ContextPtr context) diff --git a/src/Storages/ObjectStorage/StorageObjectStorageConfiguration.h b/src/Storages/ObjectStorage/StorageObjectStorageConfiguration.h index c1dd04340c06..239f00812a8d 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageConfiguration.h +++ b/src/Storages/ObjectStorage/StorageObjectStorageConfiguration.h @@ -77,8 +77,7 @@ class StorageObjectStorageConfiguration using Paths = std::vector; /// Initialize configuration from either AST or NamedCollection. - static void initialize( - StorageObjectStorageConfiguration & configuration_to_initialize, + virtual void initialize( ASTs & engine_args, ContextPtr local_context, bool with_table_structure); @@ -99,11 +98,11 @@ class StorageObjectStorageConfiguration /// Raw URI, specified by a user. Used in permission check. 
virtual const String & getRawURI() const = 0; - const Path & getPathForRead() const; + virtual const Path & getPathForRead() const; // Path used for writing, it should not be globbed and might contain a partition key - Path getPathForWrite(const std::string & partition_id = "") const; + virtual Path getPathForWrite(const std::string & partition_id = "") const; - void setPathForRead(const Path & path) + virtual void setPathForRead(const Path & path) { read_path = path; } @@ -125,10 +124,10 @@ class StorageObjectStorageConfiguration virtual void addStructureAndFormatToArgsIfNeeded( ASTs & args, const String & structure_, const String & format_, ContextPtr context, bool with_structure) = 0; - bool isNamespaceWithGlobs() const; + virtual bool isNamespaceWithGlobs() const; virtual bool isArchive() const { return false; } - bool isPathInArchiveWithGlobs() const; + virtual bool isPathInArchiveWithGlobs() const; virtual std::string getPathInArchive() const; virtual void check(ContextPtr context); @@ -175,7 +174,7 @@ class StorageObjectStorageConfiguration ContextPtr local_context, const PrepareReadingFromFormatHiveParams & hive_parameters); - void initPartitionStrategy(ASTPtr partition_by, const ColumnsDescription & columns, ContextPtr context); + virtual void initPartitionStrategy(ASTPtr partition_by, const ColumnsDescription & columns, ContextPtr context); virtual StorageInMemoryMetadata getStorageSnapshotMetadata(ContextPtr local_context) const; virtual std::optional tryGetTableStructureFromMetadata(ContextPtr local_context) const; @@ -246,6 +245,45 @@ class StorageObjectStorageConfiguration throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method getDataLakeSettings() is not implemented for configuration type {}", getTypeName()); } + /// Create arguments for table function with path and access parameters + virtual ASTPtr createArgsWithAccessData() const + { + throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method createArgsWithAccessData is not supported by storage {}", getEngineName()); + } + + virtual void fromNamedCollection(const NamedCollection & collection, ContextPtr context) = 0; + virtual void fromAST(ASTs & args, ContextPtr context, bool with_structure) = 0; + + virtual ObjectStorageType extractDynamicStorageType(ASTs & /* args */, ContextPtr /* context */, ASTPtr * /* type_arg */) const + { return ObjectStorageType::None; } + + virtual const String & getFormat() const { return format; } + virtual const String & getCompressionMethod() const { return compression_method; } + virtual const String & getStructure() const { return structure; } + + virtual PartitionStrategyFactory::StrategyType getPartitionStrategyType() const { return partition_strategy_type; } + virtual bool getPartitionColumnsInDataFile() const { return partition_columns_in_data_file; } + virtual std::shared_ptr getPartitionStrategy() const { return partition_strategy; } + + virtual void setFormat(const String & format_) { format = format_; } + virtual void setCompressionMethod(const String & compression_method_) { compression_method = compression_method_; } + virtual void setStructure(const String & structure_) { structure = structure_; } + + virtual void setPartitionStrategyType(PartitionStrategyFactory::StrategyType partition_strategy_type_) + { + partition_strategy_type = partition_strategy_type_; + } + virtual void setPartitionColumnsInDataFile(bool partition_columns_in_data_file_) + { + partition_columns_in_data_file = partition_columns_in_data_file_; + } + virtual void setPartitionStrategy(const std::shared_ptr & 
partition_strategy_) + { + partition_strategy = partition_strategy_; + } + + virtual void assertInitialized() const; + virtual ColumnMapperPtr getColumnMapperForObject(ObjectInfoPtr /**/) const { return nullptr; } virtual ColumnMapperPtr getColumnMapperForCurrentSchema(StorageMetadataPtr /**/, ContextPtr /**/) const { return nullptr; } @@ -260,6 +298,7 @@ class StorageObjectStorageConfiguration virtual void drop(ContextPtr) {} +private: String format = "auto"; String compression_method = "auto"; String structure = "auto"; @@ -271,15 +310,11 @@ class StorageObjectStorageConfiguration protected: void initializeFromParsedArguments(const StorageParsedArguments & parsed_arguments); - virtual void fromNamedCollection(const NamedCollection & collection, ContextPtr context) = 0; - virtual void fromAST(ASTs & args, ContextPtr context, bool with_structure) = 0; virtual void fromDisk(const String & /*disk_name*/, ASTs & /*args*/, ContextPtr /*context*/, bool /*with_structure*/) { throw Exception(ErrorCodes::NOT_IMPLEMENTED, "method fromDisk is not implemented"); } - void assertInitialized() const; - bool initialized = false; private: diff --git a/src/Storages/ObjectStorage/StorageObjectStorageSettings.h b/src/Storages/ObjectStorage/StorageObjectStorageSettings.h index 1314b7d87c3d..180d71ea0c8a 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageSettings.h +++ b/src/Storages/ObjectStorage/StorageObjectStorageSettings.h @@ -68,7 +68,17 @@ struct StorageObjectStorageSettings using StorageObjectStorageSettingsPtr = std::shared_ptr; +// clang-format off + +#define STORAGE_OBJECT_STORAGE_RELATED_SETTINGS(DECLARE, ALIAS) \ + DECLARE(String, object_storage_cluster, "", R"( +Cluster for distributed requests +)", 0) \ + +// clang-format on + #define LIST_OF_STORAGE_OBJECT_STORAGE_SETTINGS(M, ALIAS) \ + STORAGE_OBJECT_STORAGE_RELATED_SETTINGS(M, ALIAS) \ LIST_OF_ALL_FORMAT_SETTINGS(M, ALIAS) } diff --git a/src/Storages/ObjectStorage/StorageObjectStorageSink.cpp b/src/Storages/ObjectStorage/StorageObjectStorageSink.cpp index 2e4fee714f6c..c629bf899f09 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageSink.cpp +++ b/src/Storages/ObjectStorage/StorageObjectStorageSink.cpp @@ -142,7 +142,7 @@ PartitionedStorageObjectStorageSink::PartitionedStorageObjectStorageSink( std::optional format_settings_, SharedHeader sample_block_, ContextPtr context_) - : PartitionedSink(configuration_->partition_strategy, context_, sample_block_) + : PartitionedSink(configuration_->getPartitionStrategy(), context_, sample_block_) , object_storage(object_storage_) , configuration(configuration_) , query_settings(configuration_->getQuerySettings(context_)) @@ -177,8 +177,8 @@ SinkPtr PartitionedStorageObjectStorageSink::createSinkForPartition(const String format_settings, std::make_shared(partition_strategy->getFormatHeader()), context, - configuration->format, - configuration->compression_method); + configuration->getFormat(), + configuration->getCompressionMethod()); } } diff --git a/src/Storages/ObjectStorage/StorageObjectStorageSource.cpp b/src/Storages/ObjectStorage/StorageObjectStorageSource.cpp index 580e102544e1..87c768ac1fec 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageSource.cpp +++ b/src/Storages/ObjectStorage/StorageObjectStorageSource.cpp @@ -179,6 +179,8 @@ std::shared_ptr StorageObjectStorageSource::createFileIterator( return distributed_iterator; } + configuration->update(object_storage, local_context, true); + std::unique_ptr iterator; const auto & reading_path = 
configuration->getPathForRead(); if (reading_path.hasGlobs() && hasExactlyOneBracketsExpansion(reading_path.path)) @@ -471,7 +473,7 @@ void StorageObjectStorageSource::addNumRowsToCache(const ObjectInfo & object_inf { const auto cache_key = getKeyForSchemaCache( getUniqueStoragePathIdentifier(*configuration, object_info), - object_info.getFileFormat().value_or(configuration->format), + object_info.getFileFormat().value_or(configuration->getFormat()), format_settings, read_context); schema_cache.addNumRows(cache_key, num_rows); @@ -549,7 +551,7 @@ StorageObjectStorageSource::ReaderHolder StorageObjectStorageSource::createReade const auto cache_key = getKeyForSchemaCache( getUniqueStoragePathIdentifier(*configuration, *object_info), - object_info->getFileFormat().value_or(configuration->format), + object_info->getFileFormat().value_or(configuration->getFormat()), format_settings, context_); @@ -584,13 +586,13 @@ StorageObjectStorageSource::ReaderHolder StorageObjectStorageSource::createReade CompressionMethod compression_method; if (const auto * object_info_in_archive = dynamic_cast(object_info.get())) { - compression_method = chooseCompressionMethod(configuration->getPathInArchive(), configuration->compression_method); + compression_method = chooseCompressionMethod(configuration->getPathInArchive(), configuration->getCompressionMethod()); const auto & archive_reader = object_info_in_archive->archive_reader; read_buf = archive_reader->readFile(object_info_in_archive->path_in_archive, /*throw_on_not_found=*/true); } else { - compression_method = chooseCompressionMethod(object_info->getFileName(), configuration->compression_method); + compression_method = chooseCompressionMethod(object_info->getFileName(), configuration->getCompressionMethod()); read_buf = createReadBuffer(object_info->relative_path_with_metadata, object_storage, context_, log); } @@ -622,10 +624,10 @@ StorageObjectStorageSource::ReaderHolder StorageObjectStorageSource::createReade "Reading object '{}', size: {} bytes, with format: {}", object_info->getPath(), object_info->getObjectMetadata()->size_bytes, - object_info->getFileFormat().value_or(configuration->format)); + object_info->getFileFormat().value_or(configuration->getFormat())); auto input_format = FormatFactory::instance().getInput( - object_info->getFileFormat().value_or(configuration->format), + object_info->getFileFormat().value_or(configuration->getFormat()), *read_buf, initial_header, context_, diff --git a/src/Storages/ObjectStorage/Utils.cpp b/src/Storages/ObjectStorage/Utils.cpp index f1cb422e2cd2..542329f76944 100644 --- a/src/Storages/ObjectStorage/Utils.cpp +++ b/src/Storages/ObjectStorage/Utils.cpp @@ -60,14 +60,13 @@ std::optional checkAndGetNewFileOnInsertIfNeeded( void resolveSchemaAndFormat( ColumnsDescription & columns, - std::string & format, ObjectStoragePtr object_storage, - const StorageObjectStorageConfigurationPtr & configuration, + StorageObjectStorageConfigurationPtr & configuration, std::optional format_settings, std::string & sample_path, const ContextPtr & context) { - if (format == "auto") + if (configuration->getFormat() == "auto") { if (configuration->isDataLakeConfiguration()) { @@ -89,21 +88,23 @@ void resolveSchemaAndFormat( if (columns.empty()) { - if (format == "auto") + if (configuration->getFormat() == "auto") { + std::string format; std::tie(columns, format) = StorageObjectStorage::resolveSchemaAndFormatFromData( object_storage, configuration, format_settings, sample_path, context); + configuration->setFormat(format); } else { - 
chassert(!format.empty()); + chassert(!configuration->getFormat().empty()); columns = StorageObjectStorage::resolveSchemaFromData(object_storage, configuration, format_settings, sample_path, context); } } } - else if (format == "auto") + else if (configuration->getFormat() == "auto") { - format = StorageObjectStorage::resolveFormatFromData(object_storage, configuration, format_settings, sample_path, context); + configuration->setFormat(StorageObjectStorage::resolveFormatFromData(object_storage, configuration, format_settings, sample_path, context)); } validateSupportedColumns(columns, *configuration); diff --git a/src/Storages/ObjectStorage/Utils.h b/src/Storages/ObjectStorage/Utils.h index 3045c8ec74f4..5cc48a5d581d 100644 --- a/src/Storages/ObjectStorage/Utils.h +++ b/src/Storages/ObjectStorage/Utils.h @@ -16,9 +16,8 @@ std::optional checkAndGetNewFileOnInsertIfNeeded( void resolveSchemaAndFormat( ColumnsDescription & columns, - std::string & format, ObjectStoragePtr object_storage, - const StorageObjectStorageConfigurationPtr & configuration, + StorageObjectStorageConfigurationPtr & configuration, std::optional format_settings, std::string & sample_path, const ContextPtr & context); diff --git a/src/Storages/ObjectStorage/registerStorageObjectStorage.cpp b/src/Storages/ObjectStorage/registerStorageObjectStorage.cpp index 04e16e30e3f8..89c2d4e71485 100644 --- a/src/Storages/ObjectStorage/registerStorageObjectStorage.cpp +++ b/src/Storages/ObjectStorage/registerStorageObjectStorage.cpp @@ -14,6 +14,7 @@ #include #include #include +#include #include #include #include @@ -42,11 +43,20 @@ namespace // LocalObjectStorage is only supported for Iceberg Datalake operations where Avro format is required. For regular file access, use FileStorage instead. #if USE_AWS_S3 || USE_AZURE_BLOB_STORAGE || USE_HDFS || USE_AVRO -std::shared_ptr +StoragePtr createStorageObjectStorage(const StorageFactory::Arguments & args, StorageObjectStorageConfigurationPtr configuration) { const auto context = args.getLocalContext(); - StorageObjectStorageConfiguration::initialize(*configuration, args.engine_args, context, false); + + std::string cluster_name; + + if (args.storage_def->settings) + { + if (const auto * value = args.storage_def->settings->changes.tryGet("object_storage_cluster")) + cluster_name = value->safeGet(); + } + + configuration->initialize(args.engine_args, context, false); // Use format settings from global server context + settings from // the SETTINGS clause of the create query. Settings from current @@ -77,24 +87,24 @@ createStorageObjectStorage(const StorageFactory::Arguments & args, StorageObject ContextMutablePtr context_copy = Context::createCopy(args.getContext()); Settings settings_copy = args.getLocalContext()->getSettingsCopy(); context_copy->setSettings(settings_copy); - return std::make_shared( + return std::make_shared( + cluster_name, configuration, // We only want to perform write actions (e.g. create a container in Azure) when the table is being created, // and we want to avoid it when we load the table after a server restart. configuration->createObjectStorage(context, /* is_readonly */ args.mode != LoadingStrictnessLevel::CREATE), - context_copy, /// Use global context. args.table_id, args.columns, args.constraints, + partition_by, + order_by, + context_copy, /// Use global context. 
args.comment, format_settings, args.mode, configuration->getCatalog(context, args.query.attach), args.query.if_not_exists, - /* is_datalake_query*/ false, - /* distributed_processing */ false, - partition_by, - order_by); + /* is_datalake_query*/ false); } #endif @@ -241,9 +251,8 @@ void registerStorageIceberg(StorageFactory & factory) } } else -#if USE_AWS_S3 - configuration = std::make_shared(storage_settings); -#endif + configuration = std::make_shared(storage_settings); + if (configuration == nullptr) { throw Exception(ErrorCodes::BAD_ARGUMENTS, "This storage configuration is not available at this build"); @@ -386,7 +395,7 @@ void registerStorageIceberg(StorageFactory & factory) #if USE_PARQUET && USE_DELTA_KERNEL_RS void registerStorageDeltaLake(StorageFactory & factory) { -#if USE_AWS_S3 +# if USE_AWS_S3 factory.registerStorage( DeltaLakeDefinition::storage_engine_name, [&](const StorageFactory::Arguments & args) diff --git a/src/Storages/ObjectStorageQueue/StorageObjectStorageQueue.cpp b/src/Storages/ObjectStorageQueue/StorageObjectStorageQueue.cpp index b3821dcd2ce6..0aaac41cb17e 100644 --- a/src/Storages/ObjectStorageQueue/StorageObjectStorageQueue.cpp +++ b/src/Storages/ObjectStorageQueue/StorageObjectStorageQueue.cpp @@ -303,12 +303,12 @@ StorageObjectStorageQueue::StorageObjectStorageQueue( validateSettings(*queue_settings_, is_attach); object_storage = configuration->createObjectStorage(context_, /* is_readonly */true); - FormatFactory::instance().checkFormatName(configuration->format); + FormatFactory::instance().checkFormatName(configuration->getFormat()); configuration->check(context_); ColumnsDescription columns{columns_}; std::string sample_path; - resolveSchemaAndFormat(columns, configuration->format, object_storage, configuration, format_settings, sample_path, context_); + resolveSchemaAndFormat(columns, object_storage, configuration, format_settings, sample_path, context_); configuration->check(context_); bool is_path_with_hive_partitioning = false; @@ -356,7 +356,7 @@ StorageObjectStorageQueue::StorageObjectStorageQueue( auto table_metadata = ObjectStorageQueueMetadata::syncWithKeeper( zk_path, *queue_settings_, storage_metadata.getColumns(), - configuration_->format, + configuration_->getFormat(), context_, is_attach, log); @@ -498,7 +498,7 @@ void StorageObjectStorageQueue::renameInMemory(const StorageID & new_table_id) bool StorageObjectStorageQueue::supportsSubsetOfColumns(const ContextPtr & context_) const { - return FormatFactory::instance().checkIfFormatSupportsSubsetOfColumns(configuration->format, context_, format_settings); + return FormatFactory::instance().checkIfFormatSupportsSubsetOfColumns(configuration->getFormat(), context_, format_settings); } class ReadFromObjectStorageQueue : public SourceStepWithFilter diff --git a/src/Storages/ObjectStorageQueue/StorageObjectStorageQueue.h b/src/Storages/ObjectStorageQueue/StorageObjectStorageQueue.h index 434263af5a85..83c97768c80b 100644 --- a/src/Storages/ObjectStorageQueue/StorageObjectStorageQueue.h +++ b/src/Storages/ObjectStorageQueue/StorageObjectStorageQueue.h @@ -58,7 +58,7 @@ class StorageObjectStorageQueue : public IStorage, WithContext void renameInMemory(const StorageID & new_table_id) override; - const auto & getFormatName() const { return configuration->format; } + const auto & getFormatName() const { return configuration->getFormat(); } const fs::path & getZooKeeperPath() const { return zk_path; } diff --git a/src/Storages/ObjectStorageQueue/registerQueueStorage.cpp 
b/src/Storages/ObjectStorageQueue/registerQueueStorage.cpp index cf128ceefc67..416e41000aca 100644 --- a/src/Storages/ObjectStorageQueue/registerQueueStorage.cpp +++ b/src/Storages/ObjectStorageQueue/registerQueueStorage.cpp @@ -48,7 +48,7 @@ StoragePtr createQueueStorage(const StorageFactory::Arguments & args) throw Exception(ErrorCodes::BAD_ARGUMENTS, "External data source must have arguments"); auto configuration = std::make_shared(); - StorageObjectStorageConfiguration::initialize(*configuration, args.engine_args, args.getContext(), false); + configuration->initialize(args.engine_args, args.getContext(), false); // Use format settings from global server context + settings from // the SETTINGS clause of the create query. Settings from current diff --git a/src/Storages/System/StorageSystemIcebergHistory.cpp b/src/Storages/System/StorageSystemIcebergHistory.cpp index 410dfcbc40a6..87b85120e668 100644 --- a/src/Storages/System/StorageSystemIcebergHistory.cpp +++ b/src/Storages/System/StorageSystemIcebergHistory.cpp @@ -15,7 +15,7 @@ #include #include #include -#include +#include #include #include #include @@ -57,7 +57,7 @@ void StorageSystemIcebergHistory::fillData([[maybe_unused]] MutableColumns & res const auto access = context_copy->getAccess(); - auto add_history_record = [&](const DatabaseTablesIteratorPtr & it, StorageObjectStorage * object_storage) + auto add_history_record = [&](const DatabaseTablesIteratorPtr & it, StorageObjectStorageCluster * object_storage) { if (!access->isGranted(AccessType::SHOW_TABLES, it->databaseName(), it->name())) return; @@ -106,7 +106,7 @@ void StorageSystemIcebergHistory::fillData([[maybe_unused]] MutableColumns & res // Table was dropped while acquiring the lock, skipping table continue; - if (auto * object_storage_table = dynamic_cast(storage.get())) + if (auto * object_storage_table = dynamic_cast(storage.get())) { add_history_record(iterator, object_storage_table); } diff --git a/src/Storages/extractTableFunctionFromSelectQuery.cpp b/src/Storages/extractTableFunctionFromSelectQuery.cpp index 57302036c889..c7f60240b3c7 100644 --- a/src/Storages/extractTableFunctionFromSelectQuery.cpp +++ b/src/Storages/extractTableFunctionFromSelectQuery.cpp @@ -20,7 +20,16 @@ ASTFunction * extractTableFunctionFromSelectQuery(ASTPtr & query) if (!table_expression->table_function) return nullptr; - return table_expression->table_function->as(); + auto * table_function = table_expression->table_function->as(); + return table_function; +} + +ASTExpressionList * extractTableFunctionArgumentsFromSelectQuery(ASTPtr & query) +{ + auto * table_function = extractTableFunctionFromSelectQuery(query); + if (!table_function) + return nullptr; + return table_function->arguments->as(); } } diff --git a/src/Storages/extractTableFunctionFromSelectQuery.h b/src/Storages/extractTableFunctionFromSelectQuery.h index c69cc7ce6c52..87edf01c1c82 100644 --- a/src/Storages/extractTableFunctionFromSelectQuery.h +++ b/src/Storages/extractTableFunctionFromSelectQuery.h @@ -1,12 +1,13 @@ #pragma once #include -#include #include +#include namespace DB { ASTFunction * extractTableFunctionFromSelectQuery(ASTPtr & query); +ASTExpressionList * extractTableFunctionArgumentsFromSelectQuery(ASTPtr & query); } diff --git a/src/TableFunctions/ITableFunction.h b/src/TableFunctions/ITableFunction.h index c4e7534c1e49..f60ffd005c8b 100644 --- a/src/TableFunctions/ITableFunction.h +++ b/src/TableFunctions/ITableFunction.h @@ -78,7 +78,7 @@ class ITableFunction : public std::enable_shared_from_this virtual 
bool supportsReadingSubsetOfColumns(const ContextPtr &) { return true; } - virtual bool canBeUsedToCreateTable() const { return true; } + virtual void validateUseToCreateTable() const {} // INSERT INTO TABLE FUNCTION ... PARTITION BY // Set partition by expression so `ITableFunctionObjectStorage` can construct a proper representation diff --git a/src/TableFunctions/ITableFunctionCluster.h b/src/TableFunctions/ITableFunctionCluster.h index 5345e1a0f0db..975322d054b3 100644 --- a/src/TableFunctions/ITableFunctionCluster.h +++ b/src/TableFunctions/ITableFunctionCluster.h @@ -16,6 +16,7 @@ namespace ErrorCodes extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; extern const int CLUSTER_DOESNT_EXIST; extern const int LOGICAL_ERROR; + extern const int BAD_ARGUMENTS; } /// Base class for *Cluster table functions that require cluster_name for the first argument. @@ -46,9 +47,13 @@ class ITableFunctionCluster : public Base throw Exception(ErrorCodes::LOGICAL_ERROR, "Unexpected table function name: {}", table_function->name); } - bool canBeUsedToCreateTable() const override { return false; } bool isClusterFunction() const override { return true; } + void validateUseToCreateTable() const override + { + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Table function '{}' cannot be used to create a table", getName()); + } + protected: void parseArguments(const ASTPtr & ast, ContextPtr context) override { diff --git a/src/TableFunctions/TableFunctionObjectStorage.cpp b/src/TableFunctions/TableFunctionObjectStorage.cpp index 6f8815c7f8ba..444ded628a1a 100644 --- a/src/TableFunctions/TableFunctionObjectStorage.cpp +++ b/src/TableFunctions/TableFunctionObjectStorage.cpp @@ -195,7 +195,7 @@ template ColumnsDescription TableFunctionObjectStorage< Definition, Configuration, is_data_lake>::getActualTableStructure(ContextPtr context, bool is_insert_query) const { - if (configuration->structure == "auto") + if (configuration->getStructure() == "auto") { if (const auto access_object = getSourceAccessObject()) context->checkAccess(AccessType::READ, toStringSource(*access_object)); @@ -210,7 +210,6 @@ ColumnsDescription TableFunctionObjectStorage< ColumnsDescription columns; resolveSchemaAndFormat( columns, - configuration->format, std::move(storage), configuration, /* format_settings */std::nullopt, @@ -227,7 +226,7 @@ ColumnsDescription TableFunctionObjectStorage< return columns; } - return parseColumnsListFromString(configuration->structure, context); + return parseColumnsListFromString(configuration->getStructure(), context); } template @@ -241,8 +240,8 @@ StoragePtr TableFunctionObjectStorage:: chassert(configuration); ColumnsDescription columns; - if (configuration->structure != "auto") - columns = parseColumnsListFromString(configuration->structure, context); + if (configuration->getStructure() != "auto") + columns = parseColumnsListFromString(configuration->getStructure(), context); else if (!structure_hint.empty()) columns = structure_hint; else if (!cached_columns.empty()) @@ -270,7 +269,14 @@ StoragePtr TableFunctionObjectStorage:: columns, ConstraintsDescription{}, partition_by, + /* order_by */ nullptr, context, + /* comment */ String{}, + /* format_settings */ std::nullopt, /// No format_settings + /* mode */ LoadingStrictnessLevel::CREATE, + configuration->getCatalog(context, /*attach*/ false), + /* if_not_exists */ false, + /* is_datalake_query*/ false, /* is_table_function */true); storage->startup(); @@ -321,18 +327,7 @@ void registerTableFunctionObjectStorage(TableFunctionFactory & factory) { 
UNUSED(factory); #if USE_AWS_S3 - factory.registerFunction>( - { - .documentation = - { - .description=R"(The table function can be used to read the data stored on AWS S3.)", - .examples{{S3Definition::name, "SELECT * FROM s3(url, access_key_id, secret_access_key)", ""}}, - .category = FunctionDocumentation::Category::TableFunction - }, - .allow_readonly = false - }); - - factory.registerFunction>( + factory.registerFunction>( { .documentation = { @@ -343,7 +338,7 @@ void registerTableFunctionObjectStorage(TableFunctionFactory & factory) .allow_readonly = false }); - factory.registerFunction>( + factory.registerFunction>( { .documentation = { @@ -354,7 +349,7 @@ void registerTableFunctionObjectStorage(TableFunctionFactory & factory) .allow_readonly = false }); - factory.registerFunction>( + factory.registerFunction>( { .documentation = { @@ -365,58 +360,28 @@ void registerTableFunctionObjectStorage(TableFunctionFactory & factory) .allow_readonly = false }); #endif - -#if USE_AZURE_BLOB_STORAGE - factory.registerFunction>( - { - .documentation = - { - .description=R"(The table function can be used to read the data stored on Azure Blob Storage.)", - .examples{ - { - AzureDefinition::name, - "SELECT * FROM azureBlobStorage(connection_string|storage_account_url, container_name, blobpath, " - "[account_name, account_key, format, compression, structure])", "" - }}, - .category = FunctionDocumentation::Category::TableFunction - }, - .allow_readonly = false - }); -#endif -#if USE_HDFS - factory.registerFunction>( - { - .documentation = - { - .description=R"(The table function can be used to read the data stored on HDFS virtual filesystem.)", - .examples{ - { - HDFSDefinition::name, - "SELECT * FROM hdfs(url, format, compression, structure])", "" - }}, - .category = FunctionDocumentation::Category::TableFunction - }, - .allow_readonly = false - }); -#endif } #if USE_AZURE_BLOB_STORAGE -template class TableFunctionObjectStorage; -template class TableFunctionObjectStorage; +template class TableFunctionObjectStorage; +template class TableFunctionObjectStorage; #endif #if USE_AWS_S3 -template class TableFunctionObjectStorage; -template class TableFunctionObjectStorage; -template class TableFunctionObjectStorage; -template class TableFunctionObjectStorage; -template class TableFunctionObjectStorage; +template class TableFunctionObjectStorage; +template class TableFunctionObjectStorage; +template class TableFunctionObjectStorage; +template class TableFunctionObjectStorage; +template class TableFunctionObjectStorage; #endif #if USE_HDFS -template class TableFunctionObjectStorage; -template class TableFunctionObjectStorage; +template class TableFunctionObjectStorage; +template class TableFunctionObjectStorage; +#endif + +#if USE_AVRO +template class TableFunctionObjectStorage; #endif #if USE_AVRO @@ -465,37 +430,6 @@ template class TableFunctionObjectStorage( - {.documentation - = {.description = R"(The table function can be used to read the Iceberg table stored on S3 object store. 
Alias to icebergS3)", - .examples{{IcebergDefinition::name, "SELECT * FROM iceberg(url, access_key_id, secret_access_key)", ""}}, - .category = FunctionDocumentation::Category::TableFunction}, - .allow_readonly = false}); - factory.registerFunction( - {.documentation - = {.description = R"(The table function can be used to read the Iceberg table stored on S3 object store.)", - .examples{{IcebergS3Definition::name, "SELECT * FROM icebergS3(url, access_key_id, secret_access_key)", ""}}, - .category = FunctionDocumentation::Category::TableFunction}, - .allow_readonly = false}); - -#endif -#if USE_AZURE_BLOB_STORAGE - factory.registerFunction( - {.documentation - = {.description = R"(The table function can be used to read the Iceberg table stored on Azure object store.)", - .examples{{IcebergAzureDefinition::name, "SELECT * FROM icebergAzure(url, access_key_id, secret_access_key)", ""}}, - .category = FunctionDocumentation::Category::TableFunction}, - .allow_readonly = false}); -#endif -#if USE_HDFS - factory.registerFunction( - {.documentation - = {.description = R"(The table function can be used to read the Iceberg table stored on HDFS virtual filesystem.)", - .examples{{IcebergHDFSDefinition::name, "SELECT * FROM icebergHDFS(url)", ""}}, - .category = FunctionDocumentation::Category::TableFunction}, - .allow_readonly = false}); -#endif factory.registerFunction( {.documentation = {.description = R"(The table function can be used to read the Iceberg table stored locally.)", @@ -549,56 +483,6 @@ void registerTableFunctionPaimon(TableFunctionFactory & factory) } #endif -#if USE_PARQUET && USE_DELTA_KERNEL_RS -void registerTableFunctionDeltaLake(TableFunctionFactory & factory) -{ -#if USE_AWS_S3 - factory.registerFunction( - {.documentation - = {.description = R"(The table function can be used to read the DeltaLake table stored on S3, alias of deltaLakeS3.)", - .examples{{DeltaLakeDefinition::name, "SELECT * FROM deltaLake(url, access_key_id, secret_access_key)", ""}}, - .category = FunctionDocumentation::Category::TableFunction}, - .allow_readonly = false}); - - factory.registerFunction( - {.documentation - = {.description = R"(The table function can be used to read the DeltaLake table stored on S3.)", - .examples{{DeltaLakeS3Definition::name, "SELECT * FROM deltaLakeS3(url, access_key_id, secret_access_key)", ""}}, - .category = FunctionDocumentation::Category::TableFunction}, - .allow_readonly = false}); -#endif - -#if USE_AZURE_BLOB_STORAGE - factory.registerFunction( - {.documentation - = {.description = R"(The table function can be used to read the DeltaLake table stored on Azure object store.)", - .examples{{DeltaLakeAzureDefinition::name, "SELECT * FROM deltaLakeAzure(connection_string|storage_account_url, container_name, blobpath, \"\n" - " \"[account_name, account_key, format, compression, structure])", ""}}, - .category = FunctionDocumentation::Category::TableFunction}, - .allow_readonly = false}); -#endif - // Register the new local Delta Lake table function - factory.registerFunction( - {.documentation - = {.description = R"(The table function can be used to read the DeltaLake table stored locally.)", - .examples{{DeltaLakeLocalDefinition::name, "SELECT * FROM deltaLakeLocal(path)", ""}}, - .category = FunctionDocumentation::Category::TableFunction}, - .allow_readonly = false}); -} -#endif - -#if USE_AWS_S3 -void registerTableFunctionHudi(TableFunctionFactory & factory) -{ - factory.registerFunction( - {.documentation - = {.description = R"(The table function can be used to read the 
Hudi table stored on object store.)", - .examples{{HudiDefinition::name, "SELECT * FROM hudi(url, access_key_id, secret_access_key)", ""}}, - .category = FunctionDocumentation::Category::TableFunction}, - .allow_readonly = false}); -} -#endif - void registerDataLakeTableFunctions(TableFunctionFactory & factory) { UNUSED(factory); @@ -609,12 +493,5 @@ void registerDataLakeTableFunctions(TableFunctionFactory & factory) #if USE_AVRO registerTableFunctionPaimon(factory); #endif - -#if USE_PARQUET && USE_DELTA_KERNEL_RS - registerTableFunctionDeltaLake(factory); -#endif -#if USE_AWS_S3 - registerTableFunctionHudi(factory); -#endif } } diff --git a/src/TableFunctions/TableFunctionObjectStorage.h b/src/TableFunctions/TableFunctionObjectStorage.h index b3a0a682746b..691f4d44d9a0 100644 --- a/src/TableFunctions/TableFunctionObjectStorage.h +++ b/src/TableFunctions/TableFunctionObjectStorage.h @@ -37,15 +37,16 @@ class TableFunctionObjectStorage : public ITableFunction String getName() const override { return name; } - bool hasStaticStructure() const override { return configuration->structure != "auto"; } + bool hasStaticStructure() const override { return configuration->getStructure() != "auto"; } - bool needStructureHint() const override { return configuration->structure == "auto"; } + bool needStructureHint() const override { return configuration->getStructure() == "auto"; } void setStructureHint(const ColumnsDescription & structure_hint_) override { structure_hint = structure_hint_; } bool supportsReadingSubsetOfColumns(const ContextPtr & context) override { - return configuration->format != "auto" && FormatFactory::instance().checkIfFormatSupportsSubsetOfColumns(configuration->format, context); + return configuration->getFormat() != "auto" + && FormatFactory::instance().checkIfFormatSupportsSubsetOfColumns(configuration->getFormat(), context); } std::unordered_set getVirtualsToCheckBeforeUsingStructureHint() const override @@ -55,7 +56,7 @@ class TableFunctionObjectStorage : public ITableFunction virtual void parseArgumentsImpl(ASTs & args, const ContextPtr & context) { - StorageObjectStorageConfiguration::initialize(*getConfiguration(context), args, context, true); + getConfiguration(context)->initialize(args, context, true); } static void updateStructureAndFormatArgumentsIfNeeded( @@ -67,8 +68,8 @@ class TableFunctionObjectStorage : public ITableFunction if constexpr (is_data_lake) { Configuration configuration(createEmptySettings()); - if (configuration.format == "auto") - configuration.format = "Parquet"; /// Default format of data lakes. + if (configuration.getFormat() == "auto") + configuration.setFormat("Parquet"); /// Default format of data lakes. 
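With the plain object-storage table functions now registered through the *ClusterFallback definitions above, the single-node behaviour stays the default and the distributed variant is chosen per query. A minimal sketch of the two spellings this patch treats as equivalent, following the example strings embedded in the registrations (endpoint, credentials and cluster name below are placeholders, not values from the patch):

    -- Single-node read, unchanged behaviour.
    SELECT count() FROM s3('http://minio1:9001/root/data/*.parquet', 'minio', '<secret>');

    -- Same query fanned out over a cluster via the new setting ...
    SELECT count() FROM s3('http://minio1:9001/root/data/*.parquet', 'minio', '<secret>')
    SETTINGS object_storage_cluster = 'cluster_simple';

    -- ... which is intended to behave like the explicit cluster function.
    SELECT count() FROM s3Cluster('cluster_simple', 'http://minio1:9001/root/data/*.parquet', 'minio', '<secret>');
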
configuration.addStructureAndFormatToArgsIfNeeded(args, structure, format, context, /*with_structure=*/true); } @@ -110,21 +111,22 @@ class TableFunctionObjectStorage : public ITableFunction }; #if USE_AWS_S3 -using TableFunctionS3 = TableFunctionObjectStorage; +using TableFunctionS3 = TableFunctionObjectStorage; #endif #if USE_AZURE_BLOB_STORAGE -using TableFunctionAzureBlob = TableFunctionObjectStorage; +using TableFunctionAzureBlob = TableFunctionObjectStorage; #endif #if USE_HDFS -using TableFunctionHDFS = TableFunctionObjectStorage; +using TableFunctionHDFS = TableFunctionObjectStorage; #endif #if USE_AVRO +using TableFunctionIceberg = TableFunctionObjectStorage; + # if USE_AWS_S3 -using TableFunctionIceberg = TableFunctionObjectStorage; using TableFunctionIcebergS3 = TableFunctionObjectStorage; # endif # if USE_AZURE_BLOB_STORAGE @@ -149,13 +151,13 @@ using TableFunctionPaimonHDFS = TableFunctionObjectStorage; #endif #if USE_PARQUET && USE_DELTA_KERNEL_RS -#if USE_AWS_S3 +# if USE_AWS_S3 using TableFunctionDeltaLake = TableFunctionObjectStorage; using TableFunctionDeltaLakeS3 = TableFunctionObjectStorage; -#endif -#if USE_AZURE_BLOB_STORAGE +# endif +# if USE_AZURE_BLOB_STORAGE using TableFunctionDeltaLakeAzure = TableFunctionObjectStorage; -#endif +# endif // New alias for local Delta Lake table function using TableFunctionDeltaLakeLocal = TableFunctionObjectStorage; #endif diff --git a/src/TableFunctions/TableFunctionObjectStorageCluster.cpp b/src/TableFunctions/TableFunctionObjectStorageCluster.cpp index 830ca1ad5cb8..758a5ddfe778 100644 --- a/src/TableFunctions/TableFunctionObjectStorageCluster.cpp +++ b/src/TableFunctions/TableFunctionObjectStorageCluster.cpp @@ -22,8 +22,9 @@ StoragePtr TableFunctionObjectStorageClusterstructure != "auto") - columns = parseColumnsListFromString(configuration->structure, context); + + if (configuration->getStructure() != "auto") + columns = parseColumnsListFromString(configuration->getStructure(), context); else if (!Base::structure_hint.empty()) columns = Base::structure_hint; else if (!cached_columns.empty()) @@ -70,8 +71,16 @@ StoragePtr TableFunctionObjectStorageClusterstartup(); @@ -139,39 +148,49 @@ void registerTableFunctionIcebergCluster(TableFunctionFactory & factory) .category = FunctionDocumentation::Category::TableFunction}, .allow_readonly = false}); -#if USE_AWS_S3 factory.registerFunction( {.documentation - = {.description = R"(The table function can be used to read the Iceberg table stored on store from disk in parallel for many nodes in a specified cluster.)", - .examples{{IcebergClusterDefinition::name, "SELECT * FROM icebergCluster(cluster) SETTINGS disk = 'disk'", ""},{IcebergClusterDefinition::name, "SELECT * FROM icebergCluster(cluster, url, [, NOSIGN | access_key_id, secret_access_key, [session_token]], format, [,compression])", ""}}, + = {.description = R"(The table function can be used to read the Iceberg table stored on any object store in parallel for many nodes in a specified cluster.)", + .examples{ +# if USE_AWS_S3 + {"icebergCluster", "SELECT * FROM icebergCluster(cluster, url, [, NOSIGN | access_key_id, secret_access_key, [session_token]], format, [,compression], storage_type='s3')", ""}, +# endif +# if USE_AZURE_BLOB_STORAGE + {"icebergCluster", "SELECT * FROM icebergCluster(cluster, connection_string|storage_account_url, container_name, blobpath, [account_name, account_key, format, compression], storage_type='azure')", ""}, +# endif +# if USE_HDFS + {"icebergCluster", "SELECT * FROM icebergCluster(cluster, uri, 
[format], [structure], [compression_method], storage_type='hdfs')", ""}, +# endif + }, .category = FunctionDocumentation::Category::TableFunction}, .allow_readonly = false}); +# if USE_AWS_S3 factory.registerFunction( {.documentation = {.description = R"(The table function can be used to read the Iceberg table stored on S3 object store in parallel for many nodes in a specified cluster.)", .examples{{IcebergS3ClusterDefinition::name, "SELECT * FROM icebergS3Cluster(cluster, url, [, NOSIGN | access_key_id, secret_access_key, [session_token]], format, [,compression])", ""}}, .category = FunctionDocumentation::Category::TableFunction}, .allow_readonly = false}); -#endif +# endif -#if USE_AZURE_BLOB_STORAGE +# if USE_AZURE_BLOB_STORAGE factory.registerFunction( {.documentation = {.description = R"(The table function can be used to read the Iceberg table stored on Azure object store in parallel for many nodes in a specified cluster.)", .examples{{IcebergAzureClusterDefinition::name, "SELECT * FROM icebergAzureCluster(cluster, connection_string|storage_account_url, container_name, blobpath, [account_name, account_key, format, compression])", ""}}, .category = FunctionDocumentation::Category::TableFunction}, .allow_readonly = false}); -#endif +# endif -#if USE_HDFS +# if USE_HDFS factory.registerFunction( {.documentation = {.description = R"(The table function can be used to read the Iceberg table stored on HDFS virtual filesystem in parallel for many nodes in a specified cluster.)", .examples{{IcebergHDFSClusterDefinition::name, "SELECT * FROM icebergHDFSCluster(cluster, uri, [format], [structure], [compression_method])", ""}}, .category = FunctionDocumentation::Category::TableFunction}, .allow_readonly = false}); -#endif +# endif } void registerTableFunctionPaimonCluster(TableFunctionFactory & factory) diff --git a/src/TableFunctions/TableFunctionObjectStorageCluster.h b/src/TableFunctions/TableFunctionObjectStorageCluster.h index 06a83fc19ef8..483fe2636227 100644 --- a/src/TableFunctions/TableFunctionObjectStorageCluster.h +++ b/src/TableFunctions/TableFunctionObjectStorageCluster.h @@ -13,8 +13,6 @@ namespace DB class Context; -class StorageS3Settings; -class StorageAzureBlobSettings; class StorageS3Configuration; class StorageAzureConfiguration; @@ -46,8 +44,8 @@ class TableFunctionObjectStorageCluster : public ITableFunctionClusterstructure != "auto"; } - bool needStructureHint() const override { return Base::getConfiguration(getQueryOrGlobalContext())->structure == "auto"; } + bool hasStaticStructure() const override { return Base::getConfiguration(getQueryOrGlobalContext())->getStructure() != "auto"; } + bool needStructureHint() const override { return Base::getConfiguration(getQueryOrGlobalContext())->getStructure() == "auto"; } void setStructureHint(const ColumnsDescription & structure_hint_) override { Base::structure_hint = structure_hint_; } private: static ContextPtr getQueryOrGlobalContext() @@ -59,15 +57,19 @@ class TableFunctionObjectStorageCluster : public ITableFunctionCluster; +using TableFunctionS3Cluster = TableFunctionObjectStorageCluster; #endif #if USE_AZURE_BLOB_STORAGE -using TableFunctionAzureBlobCluster = TableFunctionObjectStorageCluster; +using TableFunctionAzureBlobCluster = TableFunctionObjectStorageCluster; #endif #if USE_HDFS -using TableFunctionHDFSCluster = TableFunctionObjectStorageCluster; +using TableFunctionHDFSCluster = TableFunctionObjectStorageCluster; +#endif + +#if USE_AVRO +using TableFunctionIcebergCluster = TableFunctionObjectStorageCluster; #endif 
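The icebergCluster registration above documents an optional storage_type argument, so the generic iceberg entry points can target S3, Azure or HDFS without a backend-specific function name. A usage sketch assembled from those example strings (URI, credentials and cluster name are placeholders):

    -- Explicit cluster function with backend selection.
    SELECT * FROM icebergCluster('cluster_simple',
        'http://minio1:9001/root/warehouse/t/', 'minio', '<secret>',
        storage_type='s3');

    -- Generic single-node form targeting HDFS, distributed via the setting instead.
    SELECT * FROM iceberg('hdfs://namenode:9000/warehouse/t/', storage_type='hdfs')
    SETTINGS object_storage_cluster = 'cluster_simple';
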
#if USE_AVRO @@ -76,7 +78,6 @@ using TableFunctionIcebergLocalCluster = TableFunctionObjectStorageCluster; -using TableFunctionIcebergCluster = TableFunctionObjectStorageCluster; #endif #if USE_AVRO && USE_AZURE_BLOB_STORAGE @@ -101,7 +102,7 @@ using TableFunctionPaimonHDFSCluster = TableFunctionObjectStorageCluster; using TableFunctionDeltaLakeS3Cluster = TableFunctionObjectStorageCluster; #endif diff --git a/src/TableFunctions/TableFunctionObjectStorageClusterFallback.cpp b/src/TableFunctions/TableFunctionObjectStorageClusterFallback.cpp new file mode 100644 index 000000000000..26c29fe7cff6 --- /dev/null +++ b/src/TableFunctions/TableFunctionObjectStorageClusterFallback.cpp @@ -0,0 +1,449 @@ +#include +#include +#include +#include +#include + +namespace DB +{ + +namespace Setting +{ + extern const SettingsString object_storage_cluster; +} + +namespace ErrorCodes +{ + extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int BAD_ARGUMENTS; +} + +struct S3ClusterFallbackDefinition +{ + static constexpr auto name = "s3"; + static constexpr auto storage_engine_name = "S3"; + static constexpr auto storage_engine_cluster_name = "S3Cluster"; +}; + +struct AzureClusterFallbackDefinition +{ + static constexpr auto name = "azureBlobStorage"; + static constexpr auto storage_engine_name = "Azure"; + static constexpr auto storage_engine_cluster_name = "AzureBlobStorageCluster"; +}; + +struct HDFSClusterFallbackDefinition +{ + static constexpr auto name = "hdfs"; + static constexpr auto storage_engine_name = "HDFS"; + static constexpr auto storage_engine_cluster_name = "HDFSCluster"; +}; + +struct IcebergClusterFallbackDefinition +{ + static constexpr auto name = "iceberg"; + static constexpr auto storage_engine_name = "UNDEFINED"; + static constexpr auto storage_engine_cluster_name = "IcebergCluster"; +}; + +struct IcebergS3ClusterFallbackDefinition +{ + static constexpr auto name = "icebergS3"; + static constexpr auto storage_engine_name = "S3"; + static constexpr auto storage_engine_cluster_name = "IcebergS3Cluster"; +}; + +struct IcebergAzureClusterFallbackDefinition +{ + static constexpr auto name = "icebergAzure"; + static constexpr auto storage_engine_name = "Azure"; + static constexpr auto storage_engine_cluster_name = "IcebergAzureCluster"; +}; + +struct IcebergHDFSClusterFallbackDefinition +{ + static constexpr auto name = "icebergHDFS"; + static constexpr auto storage_engine_name = "HDFS"; + static constexpr auto storage_engine_cluster_name = "IcebergHDFSCluster"; +}; + +struct DeltaLakeClusterFallbackDefinition +{ + static constexpr auto name = "deltaLake"; + static constexpr auto storage_engine_name = "S3"; + static constexpr auto storage_engine_cluster_name = "DeltaLakeS3Cluster"; +}; + +struct DeltaLakeS3ClusterFallbackDefinition +{ + static constexpr auto name = "deltaLakeS3"; + static constexpr auto storage_engine_name = "S3"; + static constexpr auto storage_engine_cluster_name = "DeltaLakeS3Cluster"; +}; + +struct DeltaLakeAzureClusterFallbackDefinition +{ + static constexpr auto name = "deltaLakeAzure"; + static constexpr auto storage_engine_name = "Azure"; + static constexpr auto storage_engine_cluster_name = "DeltaLakeAzureCluster"; +}; + +struct HudiClusterFallbackDefinition +{ + static constexpr auto name = "hudi"; + static constexpr auto storage_engine_name = "S3"; + static constexpr auto storage_engine_cluster_name = "HudiS3Cluster"; +}; + +template +void TableFunctionObjectStorageClusterFallback::parseArgumentsImpl(ASTs & args, const ContextPtr & context) +{ + if 
(args.empty()) + throw Exception( + ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + "The function {} should have arguments. The first argument must be the cluster name and the rest are the arguments of " + "corresponding table function", + getName()); + + const auto & settings = context->getSettingsRef(); + + is_cluster_function = !settings[Setting::object_storage_cluster].value.empty(); + + if (is_cluster_function) + { + ASTPtr cluster_name_arg = make_intrusive(settings[Setting::object_storage_cluster].value); + args.insert(args.begin(), cluster_name_arg); + BaseCluster::parseArgumentsImpl(args, context); + args.erase(args.begin()); + } + else + BaseSimple::parseArgumentsImpl(args, context); // NOLINT(bugprone-parent-virtual-call) +} + +template +StoragePtr TableFunctionObjectStorageClusterFallback::executeImpl( + const ASTPtr & ast_function, + ContextPtr context, + const std::string & table_name, + ColumnsDescription cached_columns, + bool is_insert_query) const +{ + if (is_cluster_function) + { + auto result = BaseCluster::executeImpl(ast_function, context, table_name, cached_columns, is_insert_query); + if (auto storage = typeid_cast>(result)) + storage->setClusterNameInSettings(true); + return result; + } + else + return BaseSimple::executeImpl(ast_function, context, table_name, cached_columns, is_insert_query); // NOLINT(bugprone-parent-virtual-call) +} + +template +void TableFunctionObjectStorageClusterFallback::validateUseToCreateTable() const +{ + if (is_cluster_function) + throw Exception( + ErrorCodes::BAD_ARGUMENTS, + "Table function '{}' cannot be used to create a table in cluster mode", + getName()); +} + +#if USE_AWS_S3 +using TableFunctionS3ClusterFallback = TableFunctionObjectStorageClusterFallback; +#endif + +#if USE_AZURE_BLOB_STORAGE +using TableFunctionAzureClusterFallback = TableFunctionObjectStorageClusterFallback; +#endif + +#if USE_HDFS +using TableFunctionHDFSClusterFallback = TableFunctionObjectStorageClusterFallback; +#endif + +#if USE_AVRO +using TableFunctionIcebergClusterFallback = TableFunctionObjectStorageClusterFallback; +#endif + +#if USE_AVRO && USE_AWS_S3 +using TableFunctionIcebergS3ClusterFallback = TableFunctionObjectStorageClusterFallback; +#endif + +#if USE_AVRO && USE_AZURE_BLOB_STORAGE +using TableFunctionIcebergAzureClusterFallback = TableFunctionObjectStorageClusterFallback; +#endif + +#if USE_AVRO && USE_HDFS +using TableFunctionIcebergHDFSClusterFallback = TableFunctionObjectStorageClusterFallback; +#endif + +#if USE_AWS_S3 && USE_PARQUET && USE_DELTA_KERNEL_RS +using TableFunctionDeltaLakeClusterFallback = TableFunctionObjectStorageClusterFallback; +using TableFunctionDeltaLakeS3ClusterFallback = TableFunctionObjectStorageClusterFallback; +#endif + +#if USE_AZURE_BLOB_STORAGE && USE_PARQUET && USE_DELTA_KERNEL_RS +using TableFunctionDeltaLakeAzureClusterFallback = TableFunctionObjectStorageClusterFallback; +#endif + +#if USE_AWS_S3 +using TableFunctionHudiClusterFallback = TableFunctionObjectStorageClusterFallback; +#endif + +void registerTableFunctionObjectStorageClusterFallback(TableFunctionFactory & factory) +{ + UNUSED(factory); +#if USE_AWS_S3 + factory.registerFunction( + { + .documentation = { + .description=R"(The table function can be used to read the data stored on S3 in parallel for many nodes in a specified cluster or from single node.)", + .examples{ + {"s3", "SELECT * FROM s3(url, format, structure)", ""}, + {"s3", "SELECT * FROM s3(url, format, structure) SETTINGS object_storage_cluster='cluster'", ""} + }, + .category = 
FunctionDocumentation::Category::TableFunction + }, + .allow_readonly = false + } + ); +#endif + +#if USE_AZURE_BLOB_STORAGE + factory.registerFunction( + { + .documentation = { + .description=R"(The table function can be used to read the data stored on Azure Blob Storage in parallel for many nodes in a specified cluster or from single node.)", + .examples{ + { + "azureBlobStorage", + "SELECT * FROM azureBlobStorage(connection_string|storage_account_url, container_name, blobpath, " + "[account_name, account_key, format, compression, structure])", "" + }, + { + "azureBlobStorage", + "SELECT * FROM azureBlobStorage(connection_string|storage_account_url, container_name, blobpath, " + "[account_name, account_key, format, compression, structure]) " + "SETTINGS object_storage_cluster='cluster'", "" + }, + }, + .category = FunctionDocumentation::Category::TableFunction + }, + .allow_readonly = false + } + ); +#endif + +#if USE_HDFS + factory.registerFunction( + { + .documentation = { + .description=R"(The table function can be used to read the data stored on HDFS virtual filesystem in parallel for many nodes in a specified cluster or from single node.)", + .examples{ + { + "hdfs", + "SELECT * FROM hdfs(url, format, compression, structure])", "" + }, + { + "hdfs", + "SELECT * FROM hdfs(url, format, compression, structure]) " + "SETTINGS object_storage_cluster='cluster'", "" + }, + }, + .category = FunctionDocumentation::Category::TableFunction + }, + .allow_readonly = false + } + ); +#endif + +#if USE_AVRO + factory.registerFunction( + { + .documentation = { + .description=R"(The table function can be used to read the Iceberg table stored on different object store in parallel for many nodes in a specified cluster or from single node.)", + .examples{ + { + "iceberg", + "SELECT * FROM iceberg(url, access_key_id, secret_access_key, storage_type='s3')", "" + }, + { + "iceberg", + "SELECT * FROM iceberg(url, access_key_id, secret_access_key, storage_type='s3') " + "SETTINGS object_storage_cluster='cluster'", "" + }, + { + "iceberg", + "SELECT * FROM iceberg(url, access_key_id, secret_access_key, storage_type='azure')", "" + }, + { + "iceberg", + "SELECT * FROM iceberg(url, storage_type='hdfs') SETTINGS object_storage_cluster='cluster'", "" + }, + }, + .category = FunctionDocumentation::Category::TableFunction + }, + .allow_readonly = false + } + ); +#endif + +#if USE_AVRO && USE_AWS_S3 + factory.registerFunction( + { + .documentation = { + .description=R"(The table function can be used to read the Iceberg table stored on S3 object store in parallel for many nodes in a specified cluster or from single node.)", + .examples{ + { + "icebergS3", + "SELECT * FROM icebergS3(url, access_key_id, secret_access_key)", "" + }, + { + "icebergS3", + "SELECT * FROM icebergS3(url, access_key_id, secret_access_key) " + "SETTINGS object_storage_cluster='cluster'", "" + }, + }, + .category = FunctionDocumentation::Category::TableFunction + }, + .allow_readonly = false + } + ); +#endif + +#if USE_AVRO && USE_AZURE_BLOB_STORAGE + factory.registerFunction( + { + .documentation = { + .description=R"(The table function can be used to read the Iceberg table stored on Azure object store in parallel for many nodes in a specified cluster or from single node.)", + .examples{ + { + "icebergAzure", + "SELECT * FROM icebergAzure(url, access_key_id, secret_access_key)", "" + }, + { + "icebergAzure", + "SELECT * FROM icebergAzure(url, access_key_id, secret_access_key) " + "SETTINGS object_storage_cluster='cluster'", "" + }, + }, + 
.category = FunctionDocumentation::Category::TableFunction + }, + .allow_readonly = false + } + ); +#endif + +#if USE_AVRO && USE_HDFS + factory.registerFunction( + { + .documentation = { + .description=R"(The table function can be used to read the Iceberg table stored on HDFS virtual filesystem in parallel for many nodes in a specified cluster or from single node.)", + .examples{ + { + "icebergHDFS", + "SELECT * FROM icebergHDFS(url)", "" + }, + { + "icebergHDFS", + "SELECT * FROM icebergHDFS(url) SETTINGS object_storage_cluster='cluster'", "" + }, + }, + .category = FunctionDocumentation::Category::TableFunction + }, + .allow_readonly = false + } + ); +#endif + +#if USE_PARQUET && USE_DELTA_KERNEL_RS +# if USE_AWS_S3 + factory.registerFunction( + { + .documentation = { + .description=R"(The table function can be used to read the DeltaLake table stored on object store in parallel for many nodes in a specified cluster or from single node.)", + .examples{ + { + "deltaLake", + "SELECT * FROM deltaLake(url, access_key_id, secret_access_key)", "" + }, + { + "deltaLake", + "SELECT * FROM deltaLake(url, access_key_id, secret_access_key) " + "SETTINGS object_storage_cluster='cluster'", "" + }, + }, + .category = FunctionDocumentation::Category::TableFunction + }, + .allow_readonly = false + } + ); + factory.registerFunction( + { + .documentation = { + .description=R"(The table function can be used to read the DeltaLake table stored on object store in parallel for many nodes in a specified cluster or from single node.)", + .examples{ + { + "deltaLakeS3", + "SELECT * FROM deltaLakeS3(url, access_key_id, secret_access_key)", "" + }, + { + "deltaLakeS3", + "SELECT * FROM deltaLakeS3(url, access_key_id, secret_access_key) " + "SETTINGS object_storage_cluster='cluster'", "" + }, + }, + .category = FunctionDocumentation::Category::TableFunction + }, + .allow_readonly = false + } + ); +# endif +# if USE_AZURE_BLOB_STORAGE + factory.registerFunction( + { + .documentation = { + .description=R"(The table function can be used to read the DeltaLake table stored on object store in parallel for many nodes in a specified cluster or from single node.)", + .examples{ + { + "deltaLakeAzure", + "SELECT * FROM deltaLakeAzure(url, access_key_id, secret_access_key)", "" + }, + { + "deltaLakeAzure", + "SELECT * FROM deltaLakeAzure(url, access_key_id, secret_access_key) " + "SETTINGS object_storage_cluster='cluster'", "" + }, + }, + .category = FunctionDocumentation::Category::TableFunction + }, + .allow_readonly = false + } + ); +# endif +#endif + +#if USE_AWS_S3 + factory.registerFunction( + { + .documentation = { + .description=R"(The table function can be used to read the Hudi table stored on object store in parallel for many nodes in a specified cluster or from single node.)", + .examples{ + { + "hudi", + "SELECT * FROM hudi(url, access_key_id, secret_access_key)", "" + }, + { + "hudi", + "SELECT * FROM hudi(url, access_key_id, secret_access_key) SETTINGS object_storage_cluster='cluster'", "" + }, + }, + .category = FunctionDocumentation::Category::TableFunction + }, + .allow_readonly = false + } + ); +#endif +} + +} diff --git a/src/TableFunctions/TableFunctionObjectStorageClusterFallback.h b/src/TableFunctions/TableFunctionObjectStorageClusterFallback.h new file mode 100644 index 000000000000..d81acac2be50 --- /dev/null +++ b/src/TableFunctions/TableFunctionObjectStorageClusterFallback.h @@ -0,0 +1,49 @@ +#pragma once +#include "config.h" +#include + +namespace DB +{ + +/** +* Class implementing 
s3/hdfs/azureBlobStorage(...) table functions, +* which allow to use simple or distributed function variant based on settings. +* If setting `object_storage_cluster` is empty, +* simple single-host variant is used, if setting not empty, cluster variant is used. +* `SELECT * FROM s3('s3://...', ...) SETTINGS object_storage_cluster='cluster'` +* is equal to +* `SELECT * FROM s3Cluster('cluster', 's3://...', ...)` +*/ + +template +class TableFunctionObjectStorageClusterFallback : public Base +{ +public: + using BaseCluster = Base; + using BaseSimple = BaseCluster::Base; + + static constexpr auto name = Definition::name; + + String getName() const override { return name; } + + void validateUseToCreateTable() const override; + +private: + const char * getStorageEngineName() const override + { + return is_cluster_function ? Definition::storage_engine_cluster_name : Definition::storage_engine_name; + } + + StoragePtr executeImpl( + const ASTPtr & ast_function, + ContextPtr context, + const std::string & table_name, + ColumnsDescription cached_columns, + bool is_insert_query) const override; + + void parseArgumentsImpl(ASTs & args, const ContextPtr & context) override; + + bool is_cluster_function = false; +}; + +} diff --git a/src/TableFunctions/registerTableFunctions.cpp b/src/TableFunctions/registerTableFunctions.cpp index bfd3bc69a13a..77723732080d 100644 --- a/src/TableFunctions/registerTableFunctions.cpp +++ b/src/TableFunctions/registerTableFunctions.cpp @@ -69,6 +69,7 @@ void registerTableFunctions() registerTableFunctionObjectStorage(factory); registerTableFunctionObjectStorageCluster(factory); + registerTableFunctionObjectStorageClusterFallback(factory); registerDataLakeTableFunctions(factory); registerDataLakeClusterTableFunctions(factory); diff --git a/src/TableFunctions/registerTableFunctions.h b/src/TableFunctions/registerTableFunctions.h index 9a4c19fbad14..49a65507cf9d 100644 --- a/src/TableFunctions/registerTableFunctions.h +++ b/src/TableFunctions/registerTableFunctions.h @@ -70,6 +70,7 @@ void registerTableFunctionExplain(TableFunctionFactory & factory); void registerTableFunctionObjectStorage(TableFunctionFactory & factory); void registerTableFunctionObjectStorageCluster(TableFunctionFactory & factory); +void registerTableFunctionObjectStorageClusterFallback(TableFunctionFactory & factory); void registerDataLakeTableFunctions(TableFunctionFactory & factory); void registerDataLakeClusterTableFunctions(TableFunctionFactory & factory); diff --git a/tests/integration/helpers/iceberg_utils.py b/tests/integration/helpers/iceberg_utils.py index a0b65b59a835..592b4415ccd4 100644 --- a/tests/integration/helpers/iceberg_utils.py +++ b/tests/integration/helpers/iceberg_utils.py @@ -200,8 +200,11 @@ def get_creation_expression( table_function=False, use_version_hint=False, run_on_cluster=False, + object_storage_cluster=False, explicit_metadata_path="", additional_settings = [], + storage_type_as_arg=False, + storage_type_in_named_collection=False, **kwargs, ): settings_array = list(additional_settings) @@ -212,6 +215,9 @@ def get_creation_expression( if use_version_hint: settings_array.append("iceberg_use_version_hint = true") + if object_storage_cluster: + settings_array.append(f"object_storage_cluster = '{object_storage_cluster}'") + if partition_by: partition_by = "PARTITION BY " + partition_by @@ -228,6 +234,22 @@ def get_creation_expression( else: settings_expression = "" + storage_arg = storage_type + engine_part = "" + if (storage_type_in_named_collection): + storage_arg += 
"_with_type" + elif (storage_type_as_arg): + storage_arg += f", storage_type='{storage_type}'" + else: + if (storage_type == "s3"): + engine_part = "S3" + elif (storage_type == "azure"): + engine_part = "Azure" + elif (storage_type == "hdfs"): + engine_part = "HDFS" + elif (storage_type == "local"): + engine_part = "Local" + if_not_exists_prefix = "" if if_not_exists: if_not_exists_prefix = "IF NOT EXISTS" @@ -240,16 +262,16 @@ def get_creation_expression( if run_on_cluster: assert table_function - return f"icebergS3Cluster('cluster_simple', s3, filename = 'var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}, url = 'http://minio1:9001/{bucket}/')" + return f"iceberg{engine_part}Cluster('cluster_simple', {storage_arg}, filename = 'var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}, url = 'http://minio1:9001/{bucket}/')" else: if table_function: - return f"icebergS3(s3, filename = 'var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}, url = 'http://minio1:9001/{bucket}/')" + return f"iceberg{engine_part}({storage_arg}, filename = 'var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}, url = 'http://minio1:9001/{bucket}/')" else: return ( f""" DROP TABLE IF EXISTS {table_name}; CREATE TABLE {if_not_exists_prefix} {table_name} {schema} - ENGINE=IcebergS3(s3, filename = 'var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}, url = 'http://minio1:9001/{bucket}/') + ENGINE=Iceberg{engine_part}({storage_arg}, filename = 'var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}, url = 'http://minio1:9001/{bucket}/') {order_by} {partition_by} {settings_expression}; @@ -260,19 +282,19 @@ def get_creation_expression( if run_on_cluster: assert table_function return f""" - icebergAzureCluster('cluster_simple', azure, container = '{cluster.azure_container_name}', storage_account_url = '{cluster.env_variables["AZURITE_STORAGE_ACCOUNT_URL"]}', blob_path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}) + iceberg{engine_part}Cluster('cluster_simple', {storage_arg}, container = '{cluster.azure_container_name}', storage_account_url = '{cluster.env_variables["AZURITE_STORAGE_ACCOUNT_URL"]}', blob_path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}) """ else: if table_function: return f""" - icebergAzure(azure, container = '{cluster.azure_container_name}', storage_account_url = '{cluster.env_variables["AZURITE_STORAGE_ACCOUNT_URL"]}', blob_path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}) + iceberg{engine_part}({storage_arg}, container = '{cluster.azure_container_name}', storage_account_url = '{cluster.env_variables["AZURITE_STORAGE_ACCOUNT_URL"]}', blob_path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}) """ else: return ( f""" DROP TABLE IF EXISTS {table_name}; CREATE TABLE {if_not_exists_prefix} {table_name} {schema} - ENGINE=IcebergAzure(azure, container = {cluster.azure_container_name}, storage_account_url = '{cluster.env_variables["AZURITE_STORAGE_ACCOUNT_URL"]}', blob_path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}) + ENGINE=Iceberg{engine_part}({storage_arg}, container = {cluster.azure_container_name}, storage_account_url = '{cluster.env_variables["AZURITE_STORAGE_ACCOUNT_URL"]}', blob_path = 
'/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}) {order_by} {partition_by} {settings_expression} @@ -283,24 +305,19 @@ def get_creation_expression( if run_on_cluster: assert table_function return f""" - icebergLocalCluster('cluster_simple', local, path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}', format={format}) + iceberg{engine_part}({storage_arg}, path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}) """ else: - if table_function: - return f""" - icebergLocal(local, path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}', format={format}) + return ( + f""" + DROP TABLE IF EXISTS {table_name}; + CREATE TABLE {if_not_exists_prefix} {table_name} {schema} + ENGINE=Iceberg{engine_part}({storage_arg}, path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}) + {order_by} + {partition_by} + {settings_expression} """ - else: - return ( - f""" - DROP TABLE IF EXISTS {table_name}; - CREATE TABLE {if_not_exists_prefix} {table_name} {schema} - ENGINE=IcebergLocal(local, path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}', format={format}) - {order_by} - {partition_by} - {settings_expression} - """ - ) + ) else: raise Exception(f"Unknown iceberg storage type: {storage_type}") @@ -386,16 +403,43 @@ def create_iceberg_table( run_on_cluster=False, format="Parquet", order_by="", + object_storage_cluster=False, **kwargs, ): if 'output_format_parquet_use_custom_encoder' in kwargs: node.query( - get_creation_expression(storage_type, table_name, cluster, schema, format_version, partition_by, if_not_exists, compression_method, format, order_by, run_on_cluster = run_on_cluster, **kwargs), + get_creation_expression( + storage_type, + table_name, + cluster, + schema, + format_version, + partition_by, + if_not_exists, + compression_method, + format, + order_by, + run_on_cluster=run_on_cluster, + object_storage_cluster=object_storage_cluster, + **kwargs), settings={"output_format_parquet_use_custom_encoder" : 0, "output_format_parquet_parallel_encoding" : 0} ) else: node.query( - get_creation_expression(storage_type, table_name, cluster, schema, format_version, partition_by, if_not_exists, compression_method, format, order_by, run_on_cluster=run_on_cluster, **kwargs), + get_creation_expression( + storage_type, + table_name, + cluster, + schema, + format_version, + partition_by, + if_not_exists, + compression_method, + format, + order_by, + run_on_cluster=run_on_cluster, + object_storage_cluster=object_storage_cluster, + **kwargs), ) diff --git a/tests/integration/test_mask_sensitive_info/test.py b/tests/integration/test_mask_sensitive_info/test.py index 4114d8f46add..b2fd3234d851 100644 --- a/tests/integration/test_mask_sensitive_info/test.py +++ b/tests/integration/test_mask_sensitive_info/test.py @@ -278,11 +278,13 @@ def test_create_table(): f"IcebergS3('http://minio1:9001/root/data/test11.csv.gz', 'minio', '{password}')", "DNS_ERROR", ), + ( + f"Iceberg(storage_type='s3', 'http://minio1:9001/root/data/test11.csv.gz', 'minio', '{password}')", + "DNS_ERROR", + ), f"AzureBlobStorage('{azure_conn_string}', 'cont', 'test_simple.csv', 'CSV')", f"AzureBlobStorage('{azure_conn_string}', 'cont', 'test_simple_1.csv', 'CSV', 'none')", - f"AzureBlobStorage('{azure_storage_account_url}', 'cont', 'test_simple_2.csv', '{azure_account_name}', '{azure_account_key}')", - f"AzureBlobStorage('{azure_storage_account_url}', 'cont', 'test_simple_3.csv', 
'{azure_account_name}', '{azure_account_key}', 'CSV')", - f"AzureBlobStorage('{azure_storage_account_url}', 'cont', 'test_simple_4.csv', '{azure_account_name}', '{azure_account_key}', 'CSV', 'none')", + f"AzureQueue('{azure_conn_string}', 'cont', '*', 'CSV') SETTINGS mode = 'unordered'", f"AzureQueue('{azure_conn_string}', 'cont', '*', 'CSV', 'none') SETTINGS mode = 'unordered'", f"AzureQueue('{azure_conn_string}', 'cont', '*', 'CSV') SETTINGS mode = 'unordered', after_processing = 'move', after_processing_move_connection_string = '{azure_conn_string}', after_processing_move_container = 'chprocessed'", @@ -293,6 +295,45 @@ def test_create_table(): f"AzureBlobStorage('BlobEndpoint=https://my-endpoint/;SharedAccessSignature=sp=r&st=2025-09-29T14:58:11Z&se=2025-09-29T00:00:00Z&spr=https&sv=2022-11-02&sr=c&sig=SECRET%SECRET%SECRET%SECRET', 'exampledatasets', 'example.csv')", "STD_EXCEPTION", ), + + f"AzureBlobStorage(named_collection_2, connection_string = '{azure_conn_string}', container = 'cont', blob_path = 'test_simple_7.csv', format = 'CSV')", + f"AzureBlobStorage(named_collection_2, storage_account_url = '{azure_storage_account_url}', container = 'cont', blob_path = 'test_simple_8.csv', account_name = '{azure_account_name}', account_key = '{azure_account_key}')", + f"AzureBlobStorage('{azure_storage_account_url}', 'cont', 'test_simple_3.csv', '{azure_account_name}', '{azure_account_key}')", + f"AzureBlobStorage('{azure_storage_account_url}', 'cont', 'test_simple_4.csv', '{azure_account_name}', '{azure_account_key}', 'CSV')", + f"AzureBlobStorage('{azure_storage_account_url}', 'cont', 'test_simple_5.csv', '{azure_account_name}', '{azure_account_key}', 'CSV', 'none')", + ( + f"IcebergAzure('{azure_conn_string}', 'cont', 'test_simple.csv')", + "FILE_DOESNT_EXIST", + ), + ( + f"IcebergAzure('{azure_storage_account_url}', 'cont', 'test_simple.csv', '{azure_account_name}', '{azure_account_key}')", + "FILE_DOESNT_EXIST", + ), + ( + f"IcebergAzure(named_collection_2, connection_string = '{azure_conn_string}', container = 'cont', blob_path = 'test_simple_7.csv', format = 'CSV')", + "FILE_DOESNT_EXIST", + ), + ( + f"IcebergAzure(named_collection_2, storage_account_url = '{azure_storage_account_url}', container = 'cont', blob_path = 'test_simple_8.csv', account_name = '{azure_account_name}', account_key = '{azure_account_key}')", + "FILE_DOESNT_EXIST", + ), + ( + f"Iceberg(storage_type='azure', '{azure_conn_string}', 'cont', 'test_simple.csv')", + "FILE_DOESNT_EXIST", + ), + ( + f"Iceberg(storage_type='azure', '{azure_storage_account_url}', 'cont', 'test_simple.csv', '{azure_account_name}', '{azure_account_key}')", + "FILE_DOESNT_EXIST", + ), + ( + f"Iceberg(storage_type='azure', named_collection_2, connection_string = '{azure_conn_string}', container = 'cont', blob_path = 'test_simple_7.csv', format = 'CSV')", + "FILE_DOESNT_EXIST", + ), + ( + f"Iceberg(storage_type='azure', named_collection_2, storage_account_url = '{azure_storage_account_url}', container = 'cont', blob_path = 'test_simple_8.csv', account_name = '{azure_account_name}', account_key = '{azure_account_key}')", + "FILE_DOESNT_EXIST", + ), + f"Kafka() SETTINGS kafka_broker_list = '127.0.0.1', kafka_topic_list = 'topic', kafka_group_name = 'group', kafka_format = 'JSONEachRow', kafka_security_protocol = 'sasl_ssl', kafka_sasl_mechanism = 'PLAIN', kafka_sasl_username = 'user', kafka_sasl_password = '{password}', format_avro_schema_registry_url = 'http://schema_user:{password}@'", f"Kafka() SETTINGS kafka_broker_list = '127.0.0.1', 
kafka_topic_list = 'topic', kafka_group_name = 'group', kafka_format = 'JSONEachRow', kafka_security_protocol = 'sasl_ssl', kafka_sasl_mechanism = 'PLAIN', kafka_sasl_username = 'user', kafka_sasl_password = '{password}', format_avro_schema_registry_url = 'http://schema_user:{password}@domain.com'", f"S3('http://minio1:9001/root/data/test5.csv.gz', 'CSV', access_key_id = 'minio', secret_access_key = '{password}', compression_method = 'gzip')", @@ -374,11 +415,9 @@ def generate_create_table_numbered(tail): generate_create_table_numbered("(`x` int) ENGINE = S3Queue('http://minio1:9001/root/data/', 'CSV') SETTINGS mode = 'ordered', after_processing = 'move', after_processing_move_uri = 'http://minio1:9001/chprocessed', after_processing_move_access_key_id = 'minio', after_processing_move_secret_access_key = '[HIDDEN]'"), generate_create_table_numbered("(`x` int) ENGINE = Iceberg('http://minio1:9001/root/data/test11.csv.gz', 'minio', '[HIDDEN]')"), generate_create_table_numbered("(`x` int) ENGINE = IcebergS3('http://minio1:9001/root/data/test11.csv.gz', 'minio', '[HIDDEN]')"), + generate_create_table_numbered("(`x` int) ENGINE = Iceberg(storage_type = 's3', 'http://minio1:9001/root/data/test11.csv.gz', 'minio', '[HIDDEN]')"), generate_create_table_numbered(f"(`x` int) ENGINE = AzureBlobStorage('{masked_azure_conn_string}', 'cont', 'test_simple.csv', 'CSV')"), generate_create_table_numbered(f"(`x` int) ENGINE = AzureBlobStorage('{masked_azure_conn_string}', 'cont', 'test_simple_1.csv', 'CSV', 'none')"), - generate_create_table_numbered(f"(`x` int) ENGINE = AzureBlobStorage('{azure_storage_account_url}', 'cont', 'test_simple_2.csv', '{azure_account_name}', '[HIDDEN]')"), - generate_create_table_numbered(f"(`x` int) ENGINE = AzureBlobStorage('{azure_storage_account_url}', 'cont', 'test_simple_3.csv', '{azure_account_name}', '[HIDDEN]', 'CSV')"), - generate_create_table_numbered(f"(`x` int) ENGINE = AzureBlobStorage('{azure_storage_account_url}', 'cont', 'test_simple_4.csv', '{azure_account_name}', '[HIDDEN]', 'CSV', 'none')"), generate_create_table_numbered(f"(`x` int) ENGINE = AzureQueue('{masked_azure_conn_string}', 'cont', '*', 'CSV') SETTINGS mode = 'unordered'"), generate_create_table_numbered(f"(`x` int) ENGINE = AzureQueue('{masked_azure_conn_string}', 'cont', '*', 'CSV', 'none') SETTINGS mode = 'unordered'"), generate_create_table_numbered(f"(`x` int) ENGINE = AzureQueue('{masked_azure_conn_string}', 'cont', '*', 'CSV') SETTINGS mode = 'unordered', after_processing = 'move', after_processing_move_connection_string = '{masked_azure_conn_string}', after_processing_move_container = 'chprocessed'",), @@ -386,6 +425,19 @@ def generate_create_table_numbered(tail): generate_create_table_numbered(f"(`x` int) ENGINE = AzureQueue('{azure_storage_account_url}', 'cont', '*', '{azure_account_name}', '[HIDDEN]', 'CSV') SETTINGS mode = 'unordered'"), generate_create_table_numbered(f"(`x` int) ENGINE = AzureQueue('{azure_storage_account_url}', 'cont', '*', '{azure_account_name}', '[HIDDEN]', 'CSV', 'none') SETTINGS mode = 'unordered'"), generate_create_table_numbered(f"(`x` int) ENGINE = AzureBlobStorage('{masked_sas_conn_string}', 'exampledatasets', 'example.csv')"), + generate_create_table_numbered(f"(`x` int) ENGINE = AzureBlobStorage(named_collection_2, connection_string = '{masked_azure_conn_string}', container = 'cont', blob_path = 'test_simple_7.csv', format = 'CSV')"), + generate_create_table_numbered(f"(`x` int) ENGINE = AzureBlobStorage(named_collection_2, storage_account_url = 
'{azure_storage_account_url}', container = 'cont', blob_path = 'test_simple_8.csv', account_name = '{azure_account_name}', account_key = '[HIDDEN]')"), + generate_create_table_numbered(f"(`x` int) ENGINE = AzureBlobStorage('{azure_storage_account_url}', 'cont', 'test_simple_3.csv', '{azure_account_name}', '[HIDDEN]')"), + generate_create_table_numbered(f"(`x` int) ENGINE = AzureBlobStorage('{azure_storage_account_url}', 'cont', 'test_simple_4.csv', '{azure_account_name}', '[HIDDEN]', 'CSV')"), + generate_create_table_numbered(f"(`x` int) ENGINE = AzureBlobStorage('{azure_storage_account_url}', 'cont', 'test_simple_5.csv', '{azure_account_name}', '[HIDDEN]', 'CSV', 'none')"), + generate_create_table_numbered(f"(`x` int) ENGINE = IcebergAzure('{masked_azure_conn_string}', 'cont', 'test_simple.csv')"), + generate_create_table_numbered(f"(`x` int) ENGINE = IcebergAzure('{azure_storage_account_url}', 'cont', 'test_simple.csv', '{azure_account_name}', '[HIDDEN]')"), + generate_create_table_numbered(f"(`x` int) ENGINE = IcebergAzure(named_collection_2, connection_string = '{masked_azure_conn_string}', container = 'cont', blob_path = 'test_simple_7.csv', format = 'CSV')"), + generate_create_table_numbered(f"(`x` int) ENGINE = IcebergAzure(named_collection_2, storage_account_url = '{azure_storage_account_url}', container = 'cont', blob_path = 'test_simple_8.csv', account_name = '{azure_account_name}', account_key = '[HIDDEN]')"), + generate_create_table_numbered(f"(`x` int) ENGINE = Iceberg(storage_type = 'azure', '{masked_azure_conn_string}', 'cont', 'test_simple.csv')"), + generate_create_table_numbered(f"(`x` int) ENGINE = Iceberg(storage_type = 'azure', '{azure_storage_account_url}', 'cont', 'test_simple.csv', '{azure_account_name}', '[HIDDEN]')"), + generate_create_table_numbered(f"(`x` int) ENGINE = Iceberg(storage_type = 'azure', named_collection_2, connection_string = '{masked_azure_conn_string}', container = 'cont', blob_path = 'test_simple_7.csv', format = 'CSV')"), + generate_create_table_numbered(f"(`x` int) ENGINE = Iceberg(storage_type = 'azure', named_collection_2, storage_account_url = '{azure_storage_account_url}', container = 'cont', blob_path = 'test_simple_8.csv', account_name = '{azure_account_name}', account_key = '[HIDDEN]')"), generate_create_table_numbered("(`x` int) ENGINE = Kafka SETTINGS kafka_broker_list = '127.0.0.1', kafka_topic_list = 'topic', kafka_group_name = 'group', kafka_format = 'JSONEachRow', kafka_security_protocol = 'sasl_ssl', kafka_sasl_mechanism = 'PLAIN', kafka_sasl_username = 'user', kafka_sasl_password = '[HIDDEN]', format_avro_schema_registry_url = 'http://schema_user:[HIDDEN]@'"), generate_create_table_numbered("(`x` int) ENGINE = Kafka SETTINGS kafka_broker_list = '127.0.0.1', kafka_topic_list = 'topic', kafka_group_name = 'group', kafka_format = 'JSONEachRow', kafka_security_protocol = 'sasl_ssl', kafka_sasl_mechanism = 'PLAIN', kafka_sasl_username = 'user', kafka_sasl_password = '[HIDDEN]', format_avro_schema_registry_url = 'http://schema_user:[HIDDEN]@domain.com'"), generate_create_table_numbered("(`x` int) ENGINE = S3('http://minio1:9001/root/data/test5.csv.gz', 'CSV', access_key_id = 'minio', secret_access_key = '[HIDDEN]', compression_method = 'gzip')"), @@ -512,9 +564,22 @@ def test_table_functions(): f"azureBlobStorage(named_collection_2, connection_string = '{azure_conn_string}', container = 'cont', blob_path = 'test_simple_7.csv', format = 'CSV')", f"azureBlobStorage(named_collection_2, storage_account_url = '{azure_storage_account_url}', 
container = 'cont', blob_path = 'test_simple_8.csv', account_name = '{azure_account_name}', account_key = '{azure_account_key}')", f"iceberg('http://minio1:9001/root/data/test11.csv.gz', 'minio', '{password}')", - f"gcs('http://minio1:9001/root/data/test11.csv.gz', 'minio', '{password}')", + f"iceberg(named_collection_2, url = 'http://minio1:9001/root/data/test4.csv', access_key_id = 'minio', secret_access_key = '{password}')", f"icebergS3('http://minio1:9001/root/data/test11.csv.gz', 'minio', '{password}')", + f"icebergS3(named_collection_2, url = 'http://minio1:9001/root/data/test4.csv', access_key_id = 'minio', secret_access_key = '{password}')", + f"icebergAzure('{azure_conn_string}', 'cont', 'test_simple.csv')", + f"icebergAzure('{azure_storage_account_url}', 'cont', 'test_simple.csv', '{azure_account_name}', '{azure_account_key}')", f"icebergAzure('{azure_storage_account_url}', 'cont', 'test_simple_6.csv', '{azure_account_name}', '{azure_account_key}', 'CSV', 'none', 'auto')", + f"icebergAzure(named_collection_2, connection_string = '{azure_conn_string}', container = 'cont', blob_path = 'test_simple_7.csv', format = 'CSV')", + f"icebergAzure(named_collection_2, storage_account_url = '{azure_storage_account_url}', container = 'cont', blob_path = 'test_simple_8.csv', account_name = '{azure_account_name}', account_key = '{azure_account_key}')", + f"iceberg(storage_type='s3', 'http://minio1:9001/root/data/test11.csv.gz', 'minio', '{password}')", + f"iceberg(storage_type='s3', named_collection_2, url = 'http://minio1:9001/root/data/test4.csv', access_key_id = 'minio', secret_access_key = '{password}')", + f"iceberg(storage_type='azure', '{azure_conn_string}', 'cont', 'test_simple.csv')", + f"iceberg(storage_type='azure', '{azure_storage_account_url}', 'cont', 'test_simple.csv', '{azure_account_name}', '{azure_account_key}')", + f"iceberg(storage_type='azure', '{azure_storage_account_url}', 'cont', 'test_simple_6.csv', '{azure_account_name}', '{azure_account_key}', 'CSV', 'none', 'auto')", + f"iceberg(storage_type='azure', named_collection_2, connection_string = '{azure_conn_string}', container = 'cont', blob_path = 'test_simple_7.csv', format = 'CSV')", + f"iceberg(storage_type='azure', named_collection_2, storage_account_url = '{azure_storage_account_url}', container = 'cont', blob_path = 'test_simple_8.csv', account_name = '{azure_account_name}', account_key = '{azure_account_key}')", + f"gcs('http://minio1:9001/root/data/test11.csv.gz', 'minio', '{password}')", f"deltaLakeAzure('{azure_storage_account_url}', 'cont', 'test_simple_6.csv', '{azure_account_name}', '{azure_account_key}', 'CSV', 'none', 'auto')", f"hudi('http://minio1:9001/root/data/test7.csv', 'minio', '{password}')", f"arrowFlight('arrowflight1:5006', 'dataset', 'arrowflight_user', '{password}')", @@ -605,16 +670,29 @@ def make_test_case(i): f"CREATE TABLE tablefunc37 (`x` int) AS azureBlobStorage(named_collection_2, connection_string = '{masked_azure_conn_string}', container = 'cont', blob_path = 'test_simple_7.csv', format = 'CSV')", f"CREATE TABLE tablefunc38 (`x` int) AS azureBlobStorage(named_collection_2, storage_account_url = '{azure_storage_account_url}', container = 'cont', blob_path = 'test_simple_8.csv', account_name = '{azure_account_name}', account_key = '[HIDDEN]')", "CREATE TABLE tablefunc39 (`x` int) AS iceberg('http://minio1:9001/root/data/test11.csv.gz', 'minio', '[HIDDEN]')", - "CREATE TABLE tablefunc40 (`x` int) AS gcs('http://minio1:9001/root/data/test11.csv.gz', 'minio', '[HIDDEN]')", + "CREATE TABLE 
tablefunc40 (`x` int) AS iceberg(named_collection_2, url = 'http://minio1:9001/root/data/test4.csv', access_key_id = 'minio', secret_access_key = '[HIDDEN]')", "CREATE TABLE tablefunc41 (`x` int) AS icebergS3('http://minio1:9001/root/data/test11.csv.gz', 'minio', '[HIDDEN]')", - f"CREATE TABLE tablefunc42 (`x` int) AS icebergAzure('{azure_storage_account_url}', 'cont', 'test_simple_6.csv', '{azure_account_name}', '[HIDDEN]', 'CSV', 'none', 'auto')", - f"CREATE TABLE tablefunc43 (`x` int) AS deltaLakeAzure('{azure_storage_account_url}', 'cont', 'test_simple_6.csv', '{azure_account_name}', '[HIDDEN]', 'CSV', 'none', 'auto')", - "CREATE TABLE tablefunc44 (`x` int) AS hudi('http://minio1:9001/root/data/test7.csv', 'minio', '[HIDDEN]')", - "CREATE TABLE tablefunc45 (`x` int) AS arrowFlight('arrowflight1:5006', 'dataset', 'arrowflight_user', '[HIDDEN]')", - "CREATE TABLE tablefunc46 (`x` int) AS arrowFlight(named_collection_1, host = 'arrowflight1', port = 5006, dataset = 'dataset', username = 'arrowflight_user', password = '[HIDDEN]')", - "CREATE TABLE tablefunc47 (`x` int) AS arrowflight(named_collection_1, host = 'arrowflight1', port = 5006, dataset = 'dataset', username = 'arrowflight_user', password = '[HIDDEN]')", - "CREATE TABLE tablefunc48 (`x` int) AS url('https://username:[HIDDEN]@domain.com/path', 'CSV')", - "CREATE TABLE tablefunc49 (`x` int) AS redis('localhost', 'key', 'key Int64', 0, '[HIDDEN]')", + "CREATE TABLE tablefunc42 (`x` int) AS icebergS3(named_collection_2, url = 'http://minio1:9001/root/data/test4.csv', access_key_id = 'minio', secret_access_key = '[HIDDEN]')", + f"CREATE TABLE tablefunc43 (`x` int) AS icebergAzure('{masked_azure_conn_string}', 'cont', 'test_simple.csv')", + f"CREATE TABLE tablefunc44 (`x` int) AS icebergAzure('{azure_storage_account_url}', 'cont', 'test_simple.csv', '{azure_account_name}', '[HIDDEN]')", + f"CREATE TABLE tablefunc45 (`x` int) AS icebergAzure('{azure_storage_account_url}', 'cont', 'test_simple_6.csv', '{azure_account_name}', '[HIDDEN]', 'CSV', 'none', 'auto')", + f"CREATE TABLE tablefunc46 (`x` int) AS icebergAzure(named_collection_2, connection_string = '{masked_azure_conn_string}', container = 'cont', blob_path = 'test_simple_7.csv', format = 'CSV')", + f"CREATE TABLE tablefunc47 (`x` int) AS icebergAzure(named_collection_2, storage_account_url = '{azure_storage_account_url}', container = 'cont', blob_path = 'test_simple_8.csv', account_name = '{azure_account_name}', account_key = '[HIDDEN]')", + "CREATE TABLE tablefunc48 (`x` int) AS iceberg(storage_type = 's3', 'http://minio1:9001/root/data/test11.csv.gz', 'minio', '[HIDDEN]')", + "CREATE TABLE tablefunc49 (`x` int) AS iceberg(storage_type = 's3', named_collection_2, url = 'http://minio1:9001/root/data/test4.csv', access_key_id = 'minio', secret_access_key = '[HIDDEN]')", + f"CREATE TABLE tablefunc50 (`x` int) AS iceberg(storage_type = 'azure', '{masked_azure_conn_string}', 'cont', 'test_simple.csv')", + f"CREATE TABLE tablefunc51 (`x` int) AS iceberg(storage_type = 'azure', '{azure_storage_account_url}', 'cont', 'test_simple.csv', '{azure_account_name}', '[HIDDEN]')", + f"CREATE TABLE tablefunc52 (`x` int) AS iceberg(storage_type = 'azure', '{azure_storage_account_url}', 'cont', 'test_simple_6.csv', '{azure_account_name}', '[HIDDEN]', 'CSV', 'none', 'auto')", + f"CREATE TABLE tablefunc53 (`x` int) AS iceberg(storage_type = 'azure', named_collection_2, connection_string = '{masked_azure_conn_string}', container = 'cont', blob_path = 'test_simple_7.csv', format = 'CSV')", + f"CREATE 
TABLE tablefunc54 (`x` int) AS iceberg(storage_type = 'azure', named_collection_2, storage_account_url = '{azure_storage_account_url}', container = 'cont', blob_path = 'test_simple_8.csv', account_name = '{azure_account_name}', account_key = '[HIDDEN]')", + "CREATE TABLE tablefunc55 (`x` int) AS gcs('http://minio1:9001/root/data/test11.csv.gz', 'minio', '[HIDDEN]')", + f"CREATE TABLE tablefunc56 (`x` int) AS deltaLakeAzure('{azure_storage_account_url}', 'cont', 'test_simple_6.csv', '{azure_account_name}', '[HIDDEN]', 'CSV', 'none', 'auto')", + "CREATE TABLE tablefunc57 (`x` int) AS hudi('http://minio1:9001/root/data/test7.csv', 'minio', '[HIDDEN]')", + "CREATE TABLE tablefunc58 (`x` int) AS arrowFlight('arrowflight1:5006', 'dataset', 'arrowflight_user', '[HIDDEN]')", + "CREATE TABLE tablefunc59 (`x` int) AS arrowFlight(named_collection_1, host = 'arrowflight1', port = 5006, dataset = 'dataset', username = 'arrowflight_user', password = '[HIDDEN]')", + "CREATE TABLE tablefunc60 (`x` int) AS arrowflight(named_collection_1, host = 'arrowflight1', port = 5006, dataset = 'dataset', username = 'arrowflight_user', password = '[HIDDEN]')", + "CREATE TABLE tablefunc61 (`x` int) AS url('https://username:[HIDDEN]@domain.com/path', 'CSV')", + "CREATE TABLE tablefunc62 (`x` int) AS redis('localhost', 'key', 'key Int64', 0, '[HIDDEN]')", ], must_not_contain=[password], ) diff --git a/tests/integration/test_s3_cluster/test.py b/tests/integration/test_s3_cluster/test.py index 76b8f0df2881..1153ecfc0794 100644 --- a/tests/integration/test_s3_cluster/test.py +++ b/tests/integration/test_s3_cluster/test.py @@ -2,8 +2,7 @@ import logging import os import shutil -import time -from email.errors import HeaderParseError +import uuid import pytest @@ -234,6 +233,21 @@ def test_wrong_cluster(started_cluster): assert "not found" in error + error = node.query_and_get_error( + f""" + SELECT count(*) from s3( + 'http://minio1:9001/root/data/{{clickhouse,database}}/*', + 'minio', '{minio_secret_key}', 'CSV', 'name String, value UInt32, polygon Array(Array(Tuple(Float64, Float64)))') + UNION ALL + SELECT count(*) from s3( + 'http://minio1:9001/root/data/{{clickhouse,database}}/*', + 'minio', '{minio_secret_key}', 'CSV', 'name String, value UInt32, polygon Array(Array(Tuple(Float64, Float64)))') + SETTINGS object_storage_cluster = 'non_existing_cluster' + """ + ) + + assert "not found" in error + def test_ambiguous_join(started_cluster): node = started_cluster.instances["s0_0_0"] @@ -252,6 +266,20 @@ def test_ambiguous_join(started_cluster): ) assert "AMBIGUOUS_COLUMN_NAME" not in result + result = node.query( + f""" + SELECT l.name, r.value from s3( + 'http://minio1:9001/root/data/{{clickhouse,database}}/*', 'minio', '{minio_secret_key}', 'CSV', + 'name String, value UInt32, polygon Array(Array(Tuple(Float64, Float64)))') as l + JOIN s3( + 'http://minio1:9001/root/data/{{clickhouse,database}}/*', 'minio', '{minio_secret_key}', 'CSV', + 'name String, value UInt32, polygon Array(Array(Tuple(Float64, Float64)))') as r + ON l.name = r.name + SETTINGS object_storage_cluster = 'cluster_simple' + """ + ) + assert "AMBIGUOUS_COLUMN_NAME" not in result + def test_skip_unavailable_shards(started_cluster): node = started_cluster.instances["s0_0_0"] @@ -267,6 +295,17 @@ def test_skip_unavailable_shards(started_cluster): assert result == "10\n" + result = node.query( + f""" + SELECT count(*) from s3( + 'http://minio1:9001/root/data/clickhouse/part1.csv', + 'minio', '{minio_secret_key}', 'CSV', 'name String, value UInt32, polygon 
Array(Array(Tuple(Float64, Float64)))') + SETTINGS skip_unavailable_shards = 1, object_storage_cluster = 'cluster_non_existent_port' + """ + ) + + assert result == "10\n" + def test_unset_skip_unavailable_shards(started_cluster): # Although skip_unavailable_shards is not set, cluster table functions should always skip unavailable shards. @@ -282,6 +321,17 @@ def test_unset_skip_unavailable_shards(started_cluster): assert result == "10\n" + result = node.query( + f""" + SELECT count(*) from s3( + 'http://minio1:9001/root/data/clickhouse/part1.csv', + 'minio', '{minio_secret_key}', 'CSV', 'name String, value UInt32, polygon Array(Array(Tuple(Float64, Float64)))') + SETTINGS object_storage_cluster = 'cluster_non_existent_port' + """ + ) + + assert result == "10\n" + def test_distributed_insert_select_with_replicated(started_cluster): first_replica_first_shard = started_cluster.instances["s0_0_0"] @@ -462,6 +512,18 @@ def test_cluster_format_detection(started_cluster): assert result == expected_result + result = node.query( + f"SELECT * FROM s3('http://minio1:9001/root/data/generated/*', 'minio', '{minio_secret_key}') order by c1, c2 SETTINGS object_storage_cluster = 'cluster_simple'" + ) + + assert result == expected_result + + result = node.query( + f"SELECT * FROM s3('http://minio1:9001/root/data/generated/*', 'minio', '{minio_secret_key}', auto, 'a String, b UInt64') order by a, b SETTINGS object_storage_cluster = 'cluster_simple'" + ) + + assert result == expected_result + def test_cluster_default_expression(started_cluster): node = started_cluster.instances["s0_0_0"] @@ -509,3 +571,262 @@ def test_cluster_default_expression(started_cluster): ) assert result == expected_result + + result = node.query( + f"SELECT * FROM s3('http://minio1:9001/root/data/data{{1,2,3}}', 'minio', '{minio_secret_key}', 'JSONEachRow', 'id UInt32, date Date DEFAULT 18262') order by id SETTINGS object_storage_cluster = 'cluster_simple'" + ) + + assert result == expected_result + + result = node.query( + f"SELECT * FROM s3('http://minio1:9001/root/data/data{{1,2,3}}', 'minio', '{minio_secret_key}', 'auto', 'id UInt32, date Date DEFAULT 18262') order by id SETTINGS object_storage_cluster = 'cluster_simple'" + ) + + assert result == expected_result + + result = node.query( + f"SELECT * FROM s3('http://minio1:9001/root/data/data{{1,2,3}}', 'minio', '{minio_secret_key}', 'JSONEachRow', 'id UInt32, date Date DEFAULT 18262', 'auto') order by id SETTINGS object_storage_cluster = 'cluster_simple'" + ) + + assert result == expected_result + + result = node.query( + f"SELECT * FROM s3('http://minio1:9001/root/data/data{{1,2,3}}', 'minio', '{minio_secret_key}', 'auto', 'id UInt32, date Date DEFAULT 18262', 'auto') order by id SETTINGS object_storage_cluster = 'cluster_simple'" + ) + + assert result == expected_result + + result = node.query( + "SELECT * FROM s3(test_s3_with_default) order by id SETTINGS object_storage_cluster = 'cluster_simple'" + ) + + assert result == expected_result + + +def test_distributed_s3_table_engine(started_cluster): + node = started_cluster.instances["s0_0_0"] + + resp_def = node.query( + f""" + SELECT * from s3Cluster( + 'cluster_simple', + 'http://minio1:9001/root/data/{{clickhouse,database}}/*', 'minio', '{minio_secret_key}', 'CSV', + 'name String, value UInt32, polygon Array(Array(Tuple(Float64, Float64)))') ORDER BY (name, value, polygon) + """ + ) + + node.query("DROP TABLE IF EXISTS single_node"); + node.query( + f""" + CREATE TABLE single_node + (name String, value UInt32, polygon 
Array(Array(Tuple(Float64, Float64)))) + ENGINE=S3('http://minio1:9001/root/data/{{clickhouse,database}}/*', 'minio', '{minio_secret_key}', 'CSV') + """ + ) + query_id_engine_single_node = str(uuid.uuid4()) + resp_engine_single_node = node.query( + """ + SELECT * FROM single_node ORDER BY (name, value, polygon) + """, + query_id = query_id_engine_single_node + ) + assert resp_def == resp_engine_single_node + + node.query("DROP TABLE IF EXISTS distributed"); + node.query( + f""" + CREATE TABLE distributed + (name String, value UInt32, polygon Array(Array(Tuple(Float64, Float64)))) + ENGINE=S3('http://minio1:9001/root/data/{{clickhouse,database}}/*', 'minio', '{minio_secret_key}', 'CSV') + SETTINGS object_storage_cluster='cluster_simple' + """ + ) + query_id_engine_distributed = str(uuid.uuid4()) + resp_engine_distributed = node.query( + """ + SELECT * FROM distributed ORDER BY (name, value, polygon) + """, + query_id = query_id_engine_distributed + ) + assert resp_def == resp_engine_distributed + + node.query("SYSTEM FLUSH LOGS ON CLUSTER 'cluster_simple'") + + hosts_engine_single_node = node.query( + f""" + SELECT uniq(hostname) + FROM clusterAllReplicas('cluster_simple', system.query_log) + WHERE type='QueryFinish' AND initial_query_id='{query_id_engine_single_node}' + """ + ) + assert int(hosts_engine_single_node) == 1 + hosts_engine_distributed = node.query( + f""" + SELECT uniq(hostname) + FROM clusterAllReplicas('cluster_simple', system.query_log) + WHERE type='QueryFinish' AND initial_query_id='{query_id_engine_distributed}' + """ + ) + assert int(hosts_engine_distributed) == 3 + + +def test_distributed_s3_table_engine(started_cluster): + node = started_cluster.instances["s0_0_0"] + + resp_def = node.query( + f""" + SELECT * from s3Cluster( + 'cluster_simple', + 'http://minio1:9001/root/data/{{clickhouse,database}}/*', 'minio', '{minio_secret_key}', 'CSV', + 'name String, value UInt32, polygon Array(Array(Tuple(Float64, Float64)))') ORDER BY (name, value, polygon) + """ + ) + + node.query("DROP TABLE IF EXISTS single_node"); + node.query( + f""" + CREATE TABLE single_node + (name String, value UInt32, polygon Array(Array(Tuple(Float64, Float64)))) + ENGINE=S3('http://minio1:9001/root/data/{{clickhouse,database}}/*', 'minio', '{minio_secret_key}', 'CSV') + """ + ) + query_id_engine_single_node = str(uuid.uuid4()) + resp_engine_single_node = node.query( + """ + SELECT * FROM single_node ORDER BY (name, value, polygon) + """, + query_id = query_id_engine_single_node + ) + assert resp_def == resp_engine_single_node + + node.query("DROP TABLE IF EXISTS distributed"); + node.query( + f""" + CREATE TABLE distributed + (name String, value UInt32, polygon Array(Array(Tuple(Float64, Float64)))) + ENGINE=S3('http://minio1:9001/root/data/{{clickhouse,database}}/*', 'minio', '{minio_secret_key}', 'CSV') + SETTINGS object_storage_cluster='cluster_simple' + """ + ) + query_id_engine_distributed = str(uuid.uuid4()) + resp_engine_distributed = node.query( + """ + SELECT * FROM distributed ORDER BY (name, value, polygon) + """, + query_id = query_id_engine_distributed + ) + assert resp_def == resp_engine_distributed + + node.query("SYSTEM FLUSH LOGS ON CLUSTER 'cluster_simple'") + + hosts_engine_single_node = node.query( + f""" + SELECT uniq(hostname) + FROM clusterAllReplicas('cluster_simple', system.query_log) + WHERE type='QueryFinish' AND initial_query_id='{query_id_engine_single_node}' + """ + ) + assert int(hosts_engine_single_node) == 1 + hosts_engine_distributed = node.query( + f""" + SELECT 
uniq(hostname) + FROM clusterAllReplicas('cluster_simple', system.query_log) + WHERE type='QueryFinish' AND initial_query_id='{query_id_engine_distributed}' + """ + ) + assert int(hosts_engine_distributed) == 3 + + +def test_cluster_hosts_limit(started_cluster): + node = started_cluster.instances["s0_0_0"] + + query_id_def = str(uuid.uuid4()) + resp_def = node.query( + f""" + SELECT * from s3Cluster( + 'cluster_simple', + 'http://minio1:9001/root/data/{{clickhouse,database}}/*', 'minio', '{minio_secret_key}', 'CSV', + 'name String, value UInt32, polygon Array(Array(Tuple(Float64, Float64)))') ORDER BY (name, value, polygon) + """, + query_id = query_id_def + ) + + # object_storage_max_nodes is greater than number of hosts in cluster + query_id_4_hosts = str(uuid.uuid4()) + resp_4_hosts = node.query( + f""" + SELECT * from s3Cluster( + 'cluster_simple', + 'http://minio1:9001/root/data/{{clickhouse,database}}/*', 'minio', '{minio_secret_key}', 'CSV', + 'name String, value UInt32, polygon Array(Array(Tuple(Float64, Float64)))') ORDER BY (name, value, polygon) + SETTINGS object_storage_max_nodes=4 + """, + query_id = query_id_4_hosts + ) + assert resp_def == resp_4_hosts + + # object_storage_max_nodes is equal number of hosts in cluster + query_id_3_hosts = str(uuid.uuid4()) + resp_3_hosts = node.query( + f""" + SELECT * from s3Cluster( + 'cluster_simple', + 'http://minio1:9001/root/data/{{clickhouse,database}}/*', 'minio', '{minio_secret_key}', 'CSV', + 'name String, value UInt32, polygon Array(Array(Tuple(Float64, Float64)))') ORDER BY (name, value, polygon) + SETTINGS object_storage_max_nodes=3 + """, + query_id = query_id_3_hosts + ) + assert resp_def == resp_3_hosts + + # object_storage_max_nodes is less than number of hosts in cluster + query_id_2_hosts = str(uuid.uuid4()) + resp_2_hosts = node.query( + f""" + SELECT * from s3Cluster( + 'cluster_simple', + 'http://minio1:9001/root/data/{{clickhouse,database}}/*', 'minio', '{minio_secret_key}', 'CSV', + 'name String, value UInt32, polygon Array(Array(Tuple(Float64, Float64)))') ORDER BY (name, value, polygon) + SETTINGS object_storage_max_nodes=2 + """, + query_id = query_id_2_hosts + ) + assert resp_def == resp_2_hosts + + node.query("SYSTEM FLUSH LOGS ON CLUSTER 'cluster_simple'") + + hosts_def = node.query( + f""" + SELECT uniq(hostname) + FROM clusterAllReplicas('cluster_simple', system.query_log) + WHERE type='QueryFinish' AND initial_query_id='{query_id_def}' AND query_id!='{query_id_def}' + """ + ) + assert int(hosts_def) == 3 + + hosts_4 = node.query( + f""" + SELECT uniq(hostname) + FROM clusterAllReplicas('cluster_simple', system.query_log) + WHERE type='QueryFinish' AND initial_query_id='{query_id_4_hosts}' AND query_id!='{query_id_4_hosts}' + """ + ) + assert int(hosts_4) == 3 + + hosts_3 = node.query( + f""" + SELECT uniq(hostname) + FROM clusterAllReplicas('cluster_simple', system.query_log) + WHERE type='QueryFinish' AND initial_query_id='{query_id_3_hosts}' AND query_id!='{query_id_3_hosts}' + """ + ) + assert int(hosts_3) == 3 + + hosts_2 = node.query( + f""" + SELECT uniq(hostname) + FROM clusterAllReplicas('cluster_simple', system.query_log) + WHERE type='QueryFinish' AND initial_query_id='{query_id_2_hosts}' AND query_id!='{query_id_2_hosts}' + """ + ) + assert int(hosts_2) == 2 diff --git a/tests/integration/test_storage_iceberg_no_spark/configs/config.d/named_collections.xml b/tests/integration/test_storage_iceberg_no_spark/configs/config.d/named_collections.xml index 516e4ba63a3a..7dfec41b2df8 100644 --- 
a/tests/integration/test_storage_iceberg_no_spark/configs/config.d/named_collections.xml +++ b/tests/integration/test_storage_iceberg_no_spark/configs/config.d/named_collections.xml @@ -11,5 +11,19 @@ + + http://minio1:9001/root/ + minio + ClickHouse_Minio_P@ssw0rd + s3 + + + devstoreaccount1 + Eby8vdM02xNOcqFlqUwJPLlmEtlCDXJ1OUzFT50uSRZ6IFsuFq2UVErCz4I6tq/K1SZFPTOtr/KBHBeksoGMGw== + azure + + + local + diff --git a/tests/integration/test_storage_iceberg_with_spark/configs/config.d/named_collections.xml b/tests/integration/test_storage_iceberg_with_spark/configs/config.d/named_collections.xml index 516e4ba63a3a..7dfec41b2df8 100644 --- a/tests/integration/test_storage_iceberg_with_spark/configs/config.d/named_collections.xml +++ b/tests/integration/test_storage_iceberg_with_spark/configs/config.d/named_collections.xml @@ -11,5 +11,19 @@ + + http://minio1:9001/root/ + minio + ClickHouse_Minio_P@ssw0rd + s3 + + + devstoreaccount1 + Eby8vdM02xNOcqFlqUwJPLlmEtlCDXJ1OUzFT50uSRZ6IFsuFq2UVErCz4I6tq/K1SZFPTOtr/KBHBeksoGMGw== + azure + + + local + diff --git a/tests/integration/test_storage_iceberg_with_spark/test_cluster_table_function.py b/tests/integration/test_storage_iceberg_with_spark/test_cluster_table_function.py index 56fc76859d5e..7250700e2726 100644 --- a/tests/integration/test_storage_iceberg_with_spark/test_cluster_table_function.py +++ b/tests/integration/test_storage_iceberg_with_spark/test_cluster_table_function.py @@ -18,6 +18,26 @@ from helpers.config_cluster import minio_secret_key +def count_secondary_subqueries(started_cluster, query_id, expected, comment): + for node_name, replica in started_cluster.instances.items(): + cluster_secondary_queries = ( + replica.query( + f""" + SELECT count(*) FROM system.query_log + WHERE + type = 'QueryFinish' + AND NOT is_initial_query + AND initial_query_id='{query_id}' + """ + ) + .strip() + ) + + logging.info( + f"[{node_name}] cluster_secondary_queries {comment}: {cluster_secondary_queries}" + ) + assert int(cluster_secondary_queries) == expected + @pytest.mark.parametrize("format_version", ["1", "2"]) @pytest.mark.parametrize("storage_type", ["s3", "azure", "local"]) def test_cluster_table_function(started_cluster_iceberg_with_spark, format_version, storage_type): @@ -84,54 +104,156 @@ def add_df(mode): instance.query(f"SELECT * FROM {table_function_expr}").strip().split() ) + def make_query_from_function( + run_on_cluster=False, + alt_syntax=False, + remote=False, + storage_type_as_arg=False, + storage_type_in_named_collection=False, + ): + expr = get_creation_expression( + storage_type, + TABLE_NAME, + started_cluster_iceberg_with_spark, + table_function=True, + run_on_cluster=run_on_cluster, + storage_type_as_arg=storage_type_as_arg, + storage_type_in_named_collection=storage_type_in_named_collection, + ) + query_id = str(uuid.uuid4()) + settings = "SETTINGS object_storage_cluster='cluster_simple'" if alt_syntax else "" + if remote: + query = f"SELECT * FROM remote('node2', {expr}) {settings}" + else: + query = f"SELECT * FROM {expr} {settings}" + responce = instance.query(query, query_id=query_id).strip().split() + return responce, query_id + # Cluster Query with node1 as coordinator - table_function_expr_cluster = get_creation_expression( - storage_type, - TABLE_NAME, - started_cluster_iceberg_with_spark, - table_function=True, + select_cluster, query_id_cluster = make_query_from_function(run_on_cluster=True) + + # Cluster Query with node1 as coordinator with alternative syntax + select_cluster_alt_syntax, query_id_cluster_alt_syntax 
= make_query_from_function( + run_on_cluster=True, + alt_syntax=True) + + # Cluster Query with node1 as coordinator and storage type as arg + select_cluster_with_type_arg, query_id_cluster_with_type_arg = make_query_from_function( run_on_cluster=True, + storage_type_as_arg=True, ) - select_cluster = ( - instance.query(f"SELECT * FROM {table_function_expr_cluster}").strip().split() + + # Cluster Query with node1 as coordinator and storage type in named collection + select_cluster_with_type_in_nc, query_id_cluster_with_type_in_nc = make_query_from_function( + run_on_cluster=True, + storage_type_in_named_collection=True, ) + # Cluster Query with node1 as coordinator and storage type as arg, alternative syntax + select_cluster_with_type_arg_alt_syntax, query_id_cluster_with_type_arg_alt_syntax = make_query_from_function( + storage_type_as_arg=True, + alt_syntax=True, + ) + + # Cluster Query with node1 as coordinator and storage type in named collection, alternative syntax + select_cluster_with_type_in_nc_alt_syntax, query_id_cluster_with_type_in_nc_alt_syntax = make_query_from_function( + storage_type_in_named_collection=True, + alt_syntax=True, + ) + + #select_remote_cluster, _ = make_query_from_function(run_on_cluster=True, remote=True) + + def make_query_from_table(alt_syntax=False): + query_id = str(uuid.uuid4()) + settings = "SETTINGS object_storage_cluster='cluster_simple'" if alt_syntax else "" + responce = ( + instance.query( + f"SELECT * FROM {TABLE_NAME} {settings}", + query_id=query_id, + ) + .strip() + .split() + ) + return responce, query_id + + create_iceberg_table(storage_type, instance, TABLE_NAME, started_cluster_iceberg_with_spark, object_storage_cluster='cluster_simple') + select_cluster_table_engine, query_id_cluster_table_engine = make_query_from_table() + + #select_remote_cluster = ( + # instance.query(f"SELECT * FROM remote('node2',{table_function_expr_cluster})") + # .strip() + # .split() + #) + + instance.query(f"DROP TABLE IF EXISTS `{TABLE_NAME}` SYNC") + + create_iceberg_table(storage_type, instance, TABLE_NAME, started_cluster_iceberg_with_spark) + select_pure_table_engine, query_id_pure_table_engine = make_query_from_table() + select_pure_table_engine_cluster, query_id_pure_table_engine_cluster = make_query_from_table(alt_syntax=True) + + create_iceberg_table(storage_type, instance, TABLE_NAME, started_cluster_iceberg_with_spark, storage_type_as_arg=True) + select_pure_table_engine_with_type_arg, query_id_pure_table_engine_with_type_arg = make_query_from_table() + select_pure_table_engine_cluster_with_type_arg, query_id_pure_table_engine_cluster_with_type_arg = make_query_from_table(alt_syntax=True) + + create_iceberg_table(storage_type, instance, TABLE_NAME, started_cluster_iceberg_with_spark, storage_type_in_named_collection=True) + select_pure_table_engine_with_type_in_nc, query_id_pure_table_engine_with_type_in_nc = make_query_from_table() + select_pure_table_engine_cluster_with_type_in_nc, query_id_pure_table_engine_cluster_with_type_in_nc = make_query_from_table(alt_syntax=True) + # Simple size check assert len(select_regular) == 600 assert len(select_cluster) == 600 + assert len(select_cluster_alt_syntax) == 600 + assert len(select_cluster_table_engine) == 600 + #assert len(select_remote_cluster) == 600 + assert len(select_cluster_with_type_arg) == 600 + assert len(select_cluster_with_type_in_nc) == 600 + assert len(select_cluster_with_type_arg_alt_syntax) == 600 + assert len(select_cluster_with_type_in_nc_alt_syntax) == 600 + assert 
len(select_pure_table_engine) == 600 + assert len(select_pure_table_engine_cluster) == 600 + assert len(select_pure_table_engine_with_type_arg) == 600 + assert len(select_pure_table_engine_cluster_with_type_arg) == 600 + assert len(select_pure_table_engine_with_type_in_nc) == 600 + assert len(select_pure_table_engine_cluster_with_type_in_nc) == 600 # Actual check assert select_cluster == select_regular + assert select_cluster_alt_syntax == select_regular + assert select_cluster_table_engine == select_regular + #assert select_remote_cluster == select_regular + assert select_cluster_with_type_arg == select_regular + assert select_cluster_with_type_in_nc == select_regular + assert select_cluster_with_type_arg_alt_syntax == select_regular + assert select_cluster_with_type_in_nc_alt_syntax == select_regular + assert select_pure_table_engine == select_regular + assert select_pure_table_engine_cluster == select_regular + assert select_pure_table_engine_with_type_arg == select_regular + assert select_pure_table_engine_cluster_with_type_arg == select_regular + assert select_pure_table_engine_with_type_in_nc == select_regular + assert select_pure_table_engine_cluster_with_type_in_nc == select_regular # Check query_log for replica in started_cluster_iceberg_with_spark.instances.values(): replica.query("SYSTEM FLUSH LOGS") - for node_name, replica in started_cluster_iceberg_with_spark.instances.items(): - cluster_secondary_queries = ( - replica.query( - f""" - SELECT query, type, is_initial_query, read_rows, read_bytes FROM system.query_log - WHERE - type = 'QueryStart' AND - positionCaseInsensitive(query, '{storage_type}Cluster') != 0 AND - position(query, '{TABLE_NAME}') != 0 AND - position(query, 'system.query_log') = 0 AND - NOT is_initial_query - """ - ) - .strip() - .split("\n") - ) - - logging.info( - f"[{node_name}] cluster_secondary_queries: {cluster_secondary_queries}" - ) - assert len(cluster_secondary_queries) == 1 + count_secondary_subqueries(started_cluster_iceberg_with_spark, query_id_cluster, 1, "table function") + count_secondary_subqueries(started_cluster_iceberg_with_spark, query_id_cluster_alt_syntax, 1, "table function alt syntax") + count_secondary_subqueries(started_cluster_iceberg_with_spark, query_id_cluster_table_engine, 1, "cluster table engine") + count_secondary_subqueries(started_cluster_iceberg_with_spark, query_id_cluster_with_type_arg, 1, "table function with storage type in args") + count_secondary_subqueries(started_cluster_iceberg_with_spark, query_id_cluster_with_type_in_nc, 1, "table function with storage type in named collection") + count_secondary_subqueries(started_cluster_iceberg_with_spark, query_id_cluster_with_type_arg_alt_syntax, 1, "table function with storage type in args alt syntax") + count_secondary_subqueries(started_cluster_iceberg_with_spark, query_id_cluster_with_type_in_nc_alt_syntax, 1, "table function with storage type in named collection alt syntax") + count_secondary_subqueries(started_cluster_iceberg_with_spark, query_id_pure_table_engine, 0, "table engine") + count_secondary_subqueries(started_cluster_iceberg_with_spark, query_id_pure_table_engine_cluster, 1, "table engine with cluster setting") + count_secondary_subqueries(started_cluster_iceberg_with_spark, query_id_pure_table_engine_with_type_arg, 0, "table engine with storage type in args") + count_secondary_subqueries(started_cluster_iceberg_with_spark, query_id_pure_table_engine_cluster_with_type_arg, 1, "table engine with cluster setting with storage type in args") + 
count_secondary_subqueries(started_cluster_iceberg_with_spark, query_id_pure_table_engine_with_type_in_nc, 0, "table engine with storage type in named collection") + count_secondary_subqueries(started_cluster_iceberg_with_spark, query_id_pure_table_engine_cluster_with_type_in_nc, 1, "table engine with cluster setting with storage type in named collection") # write 3 times assert int(instance.query(f"SELECT count() FROM {table_function_expr_cluster}")) == 100 * 3 + @pytest.mark.parametrize("format_version", ["1", "2"]) @pytest.mark.parametrize("storage_type", ["s3", "azure"]) def test_writes_cluster_table_function(started_cluster_iceberg_with_spark, format_version, storage_type): diff --git a/tests/integration/test_storage_iceberg_with_spark/test_types.py b/tests/integration/test_storage_iceberg_with_spark/test_types.py index 8ca675d76887..7df6cda3dcf6 100644 --- a/tests/integration/test_storage_iceberg_with_spark/test_types.py +++ b/tests/integration/test_storage_iceberg_with_spark/test_types.py @@ -86,3 +86,49 @@ def test_types(started_cluster_iceberg_with_spark, format_version, storage_type) ["e", "Nullable(Bool)"], ] ) + + # Test storage type as function argument + table_function_expr = get_creation_expression( + storage_type, + TABLE_NAME, + started_cluster_iceberg_with_spark, + table_function=True, + storage_type_as_arg=True, + ) + assert ( + instance.query(f"SELECT a, b, c, d, e FROM {table_function_expr}").strip() + == "123\tstring\t2000-01-01\t['str1','str2']\ttrue" + ) + + assert instance.query(f"DESCRIBE {table_function_expr} FORMAT TSV") == TSV( + [ + ["a", "Nullable(Int32)"], + ["b", "Nullable(String)"], + ["c", "Nullable(Date)"], + ["d", "Array(Nullable(String))"], + ["e", "Nullable(Bool)"], + ] + ) + + # Test storage type as field in named collection + table_function_expr = get_creation_expression( + storage_type, + TABLE_NAME, + started_cluster_iceberg_with_spark, + table_function=True, + storage_type_in_named_collection=True, + ) + assert ( + instance.query(f"SELECT a, b, c, d, e FROM {table_function_expr}").strip() + == "123\tstring\t2000-01-01\t['str1','str2']\ttrue" + ) + + assert instance.query(f"DESCRIBE {table_function_expr} FORMAT TSV") == TSV( + [ + ["a", "Nullable(Int32)"], + ["b", "Nullable(String)"], + ["c", "Nullable(Date)"], + ["d", "Array(Nullable(String))"], + ["e", "Nullable(Bool)"], + ] + ) From 1fcf46864493c15e855c98bbaa44c7f9c9c88d32 Mon Sep 17 00:00:00 2001 From: Anton Ivashkin Date: Tue, 10 Feb 2026 16:45:53 +0100 Subject: [PATCH 02/12] Fix overrided methods in StorageIcebergConfiguration --- .../DataLakes/DataLakeConfiguration.h | 99 ++++++++++--------- .../StorageObjectStorageConfiguration.h | 8 +- .../test_cluster_table_function.py | 3 - 3 files changed, 57 insertions(+), 53 deletions(-) diff --git a/src/Storages/ObjectStorage/DataLakes/DataLakeConfiguration.h b/src/Storages/ObjectStorage/DataLakes/DataLakeConfiguration.h index 80fc5c4e2cad..1525c286c630 100644 --- a/src/Storages/ObjectStorage/DataLakes/DataLakeConfiguration.h +++ b/src/Storages/ObjectStorage/DataLakes/DataLakeConfiguration.h @@ -435,6 +435,15 @@ class StorageIcebergConfiguration : public StorageObjectStorageConfiguration, pu public: explicit StorageIcebergConfiguration(DataLakeStorageSettingsPtr settings_) : settings(settings_) {} + void initialize( + ASTs & engine_args, + ContextPtr local_context, + bool with_table_structure) override + { + createDynamicConfiguration(engine_args, local_context); + getImpl().initialize(engine_args, local_context, with_table_structure); + } + 
ObjectStorageType getType() const override { return getImpl().getType(); } std::string getTypeName() const override { return getImpl().getTypeName(); } @@ -478,6 +487,10 @@ class StorageIcebergConfiguration : public StorageObjectStorageConfiguration, pu std::optional totalRows(ContextPtr context) override { return getImpl().totalRows(context); } std::optional totalBytes(ContextPtr context) override { return getImpl().totalBytes(context); } + bool isDataSortedBySortingKey(StorageMetadataPtr storage_metadata, ContextPtr context) const override + { return getImpl().isDataSortedBySortingKey(storage_metadata, context); } + + bool needsUpdateForSchemaConsistency() const override { return getImpl().needsUpdateForSchemaConsistency(); } IDataLakeMetadata * getExternalMetadata() override { return getImpl().getExternalMetadata(); } @@ -520,10 +533,13 @@ class StorageIcebergConfiguration : public StorageObjectStorageConfiguration, pu void initPartitionStrategy(ASTPtr partition_by, const ColumnsDescription & columns, ContextPtr context) override { getImpl().initPartitionStrategy(partition_by, columns, context); } + StorageInMemoryMetadata getStorageSnapshotMetadata(ContextPtr local_context) const override + { return getImpl().getStorageSnapshotMetadata(local_context); } std::optional tryGetTableStructureFromMetadata(ContextPtr local_context) const override { return getImpl().tryGetTableStructureFromMetadata(local_context); } bool supportsFileIterator() const override { return getImpl().supportsFileIterator(); } + bool supportsParallelInsert() const override { return getImpl().supportsParallelInsert(); } bool supportsWrites() const override { return getImpl().supportsWrites(); } bool supportsPartialPathPrefix() const override { return getImpl().supportsPartialPathPrefix(); } @@ -580,7 +596,6 @@ class StorageIcebergConfiguration : public StorageObjectStorageConfiguration, pu { getImpl().mutate(commands, context, storage_id, metadata_snapshot, catalog, format_settings); } - void checkMutationIsPossible(const MutationCommands & commands) override { getImpl().checkMutationIsPossible(commands); } void checkAlterIsPossible(const AlterCommands & commands) override { getImpl().checkAlterIsPossible(commands); } @@ -589,15 +604,6 @@ class StorageIcebergConfiguration : public StorageObjectStorageConfiguration, pu const DataLakeStorageSettings & getDataLakeSettings() const override { return getImpl().getDataLakeSettings(); } - void initialize( - ASTs & engine_args, - ContextPtr local_context, - bool with_table_structure) override - { - createDynamicConfiguration(engine_args, local_context); - getImpl().initialize(engine_args, local_context, with_table_structure); - } - ASTPtr createArgsWithAccessData() const override { return getImpl().createArgsWithAccessData(); @@ -607,41 +613,9 @@ class StorageIcebergConfiguration : public StorageObjectStorageConfiguration, pu { getImpl().fromNamedCollection(collection, context); } void fromAST(ASTs & args, ContextPtr context, bool with_structure) override { getImpl().fromAST(args, context, with_structure); } + void fromDisk(const String & disk_name, ASTs & args, ContextPtr context, bool with_structure) override + { getImpl().fromDisk(disk_name, args, context, with_structure); } - const String & getFormat() const override { return getImpl().getFormat(); } - const String & getCompressionMethod() const override { return getImpl().getCompressionMethod(); } - const String & getStructure() const override { return getImpl().getStructure(); } - - PartitionStrategyFactory::StrategyType 
getPartitionStrategyType() const override { return getImpl().getPartitionStrategyType(); } - bool getPartitionColumnsInDataFile() const override { return getImpl().getPartitionColumnsInDataFile(); } - std::shared_ptr getPartitionStrategy() const override { return getImpl().getPartitionStrategy(); } - - void setFormat(const String & format_) override { getImpl().setFormat(format_); } - void setCompressionMethod(const String & compression_method_) override { getImpl().setCompressionMethod(compression_method_); } - void setStructure(const String & structure_) override { getImpl().setStructure(structure_); } - - void setPartitionStrategyType(PartitionStrategyFactory::StrategyType partition_strategy_type_) override - { getImpl().setPartitionStrategyType(partition_strategy_type_); } - void setPartitionColumnsInDataFile(bool partition_columns_in_data_file_) override - { getImpl().setPartitionColumnsInDataFile(partition_columns_in_data_file_); } - void setPartitionStrategy(const std::shared_ptr & partition_strategy_) override - { getImpl().setPartitionStrategy(partition_strategy_); } - - ColumnMapperPtr getColumnMapperForObject(ObjectInfoPtr obj) const override { return getImpl().getColumnMapperForObject(obj); } - - ColumnMapperPtr getColumnMapperForCurrentSchema(StorageMetadataPtr storage_metadata_snapshot, ContextPtr context) const override - { return getImpl().getColumnMapperForCurrentSchema(storage_metadata_snapshot, context); } - - std::shared_ptr getCatalog(ContextPtr context, bool is_attach) const override - { return getImpl().getCatalog(context, is_attach); } - - bool optimize(const StorageMetadataPtr & metadata_snapshot, ContextPtr context, const std::optional & format_settings) override - { return getImpl().optimize(metadata_snapshot, context, format_settings); } - - StorageInMemoryMetadata getStorageSnapshotMetadata(ContextPtr local_context) const override - { return getImpl().getStorageSnapshotMetadata(local_context); } - -protected: /// Find storage_type argument and remove it from args if exists. /// Return storage type. 
ObjectStorageType extractDynamicStorageType(ASTs & args, ContextPtr context, ASTPtr * type_arg) const override @@ -713,14 +687,47 @@ class StorageIcebergConfiguration : public StorageObjectStorageConfiguration, pu return type; } + const String & getFormat() const override { return getImpl().getFormat(); } + const String & getCompressionMethod() const override { return getImpl().getCompressionMethod(); } + const String & getStructure() const override { return getImpl().getStructure(); } + + PartitionStrategyFactory::StrategyType getPartitionStrategyType() const override { return getImpl().getPartitionStrategyType(); } + bool getPartitionColumnsInDataFile() const override { return getImpl().getPartitionColumnsInDataFile(); } + std::shared_ptr getPartitionStrategy() const override { return getImpl().getPartitionStrategy(); } + + void setFormat(const String & format_) override { getImpl().setFormat(format_); } + void setCompressionMethod(const String & compression_method_) override { getImpl().setCompressionMethod(compression_method_); } + void setStructure(const String & structure_) override { getImpl().setStructure(structure_); } + + void setPartitionStrategyType(PartitionStrategyFactory::StrategyType partition_strategy_type_) override + { getImpl().setPartitionStrategyType(partition_strategy_type_); } + void setPartitionColumnsInDataFile(bool partition_columns_in_data_file_) override + { getImpl().setPartitionColumnsInDataFile(partition_columns_in_data_file_); } + void setPartitionStrategy(const std::shared_ptr & partition_strategy_) override + { getImpl().setPartitionStrategy(partition_strategy_); } + + void assertInitialized() const override { getImpl().assertInitialized(); } + + ColumnMapperPtr getColumnMapperForObject(ObjectInfoPtr obj) const override { return getImpl().getColumnMapperForObject(obj); } + + ColumnMapperPtr getColumnMapperForCurrentSchema(StorageMetadataPtr storage_metadata_snapshot, ContextPtr context) const override + { return getImpl().getColumnMapperForCurrentSchema(storage_metadata_snapshot, context); } + + std::shared_ptr getCatalog(ContextPtr context, bool is_attach) const override + { return getImpl().getCatalog(context, is_attach); } + + bool optimize(const StorageMetadataPtr & metadata_snapshot, ContextPtr context, const std::optional & format_settings) override + { return getImpl().optimize(metadata_snapshot, context, format_settings); } + + void drop(ContextPtr context) override { getImpl().drop(context); } + +protected: void createDynamicConfiguration(ASTs & args, ContextPtr context) { ObjectStorageType type = extractDynamicStorageType(args, context, nullptr); createDynamicStorage(type); } - void assertInitialized() const override { getImpl().assertInitialized(); } - private: inline StorageObjectStorageConfiguration & getImpl() const { diff --git a/src/Storages/ObjectStorage/StorageObjectStorageConfiguration.h b/src/Storages/ObjectStorage/StorageObjectStorageConfiguration.h index 239f00812a8d..54cf793da726 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageConfiguration.h +++ b/src/Storages/ObjectStorage/StorageObjectStorageConfiguration.h @@ -253,6 +253,10 @@ class StorageObjectStorageConfiguration virtual void fromNamedCollection(const NamedCollection & collection, ContextPtr context) = 0; virtual void fromAST(ASTs & args, ContextPtr context, bool with_structure) = 0; + virtual void fromDisk(const String & /*disk_name*/, ASTs & /*args*/, ContextPtr /*context*/, bool /*with_structure*/) + { + throw Exception(ErrorCodes::NOT_IMPLEMENTED, "method 
fromDisk is not implemented"); + } virtual ObjectStorageType extractDynamicStorageType(ASTs & /* args */, ContextPtr /* context */, ASTPtr * /* type_arg */) const { return ObjectStorageType::None; } @@ -310,10 +314,6 @@ class StorageObjectStorageConfiguration protected: void initializeFromParsedArguments(const StorageParsedArguments & parsed_arguments); - virtual void fromDisk(const String & /*disk_name*/, ASTs & /*args*/, ContextPtr /*context*/, bool /*with_structure*/) - { - throw Exception(ErrorCodes::NOT_IMPLEMENTED, "method fromDisk is not implemented"); - } bool initialized = false; diff --git a/tests/integration/test_storage_iceberg_with_spark/test_cluster_table_function.py b/tests/integration/test_storage_iceberg_with_spark/test_cluster_table_function.py index 7250700e2726..d964efe6ee69 100644 --- a/tests/integration/test_storage_iceberg_with_spark/test_cluster_table_function.py +++ b/tests/integration/test_storage_iceberg_with_spark/test_cluster_table_function.py @@ -250,9 +250,6 @@ def make_query_from_table(alt_syntax=False): count_secondary_subqueries(started_cluster_iceberg_with_spark, query_id_pure_table_engine_with_type_in_nc, 0, "table engine with storage type in named collection") count_secondary_subqueries(started_cluster_iceberg_with_spark, query_id_pure_table_engine_cluster_with_type_in_nc, 1, "table engine with cluster setting with storage type in named collection") - # write 3 times - assert int(instance.query(f"SELECT count() FROM {table_function_expr_cluster}")) == 100 * 3 - @pytest.mark.parametrize("format_version", ["1", "2"]) @pytest.mark.parametrize("storage_type", ["s3", "azure"]) From e940934824c0f2a2ba3e576a760f7d68ec6df845 Mon Sep 17 00:00:00 2001 From: Anton Ivashkin Date: Tue, 10 Feb 2026 17:40:13 +0100 Subject: [PATCH 03/12] Fix create table, fix test --- .../StorageObjectStorageCluster.cpp | 7 ++++++ tests/integration/helpers/iceberg_utils.py | 23 +++++++++++-------- 2 files changed, 21 insertions(+), 9 deletions(-) diff --git a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp index 329dd39f56e9..aa063fb6c8d2 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp +++ b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp @@ -109,6 +109,13 @@ StorageObjectStorageCluster::StorageObjectStorageCluster( auto log_ = getLogger("StorageObjectStorageCluster"); + if (!is_table_function && !columns_in_table_or_function_definition.empty() && !is_datalake_query && mode_ == LoadingStrictnessLevel::CREATE) + { + LOG_DEBUG(log_, "Creating new storage with specified columns"); + configuration->create( + object_storage, context_, columns_in_table_or_function_definition, partition_by, order_by, if_not_exists, catalog, table_id_); + } + try { if (!do_lazy_init) diff --git a/tests/integration/helpers/iceberg_utils.py b/tests/integration/helpers/iceberg_utils.py index 592b4415ccd4..0849f628b0f9 100644 --- a/tests/integration/helpers/iceberg_utils.py +++ b/tests/integration/helpers/iceberg_utils.py @@ -308,16 +308,21 @@ def get_creation_expression( iceberg{engine_part}({storage_arg}, path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}) """ else: - return ( - f""" - DROP TABLE IF EXISTS {table_name}; - CREATE TABLE {if_not_exists_prefix} {table_name} {schema} - ENGINE=Iceberg{engine_part}({storage_arg}, path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}) - {order_by} - {partition_by} - {settings_expression} 
+ if table_function: + return f""" + iceberg{engine_part}({storage_arg}, path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}', format={format}) """ - ) + else: + return ( + f""" + DROP TABLE IF EXISTS {table_name}; + CREATE TABLE {if_not_exists_prefix} {table_name} {schema} + ENGINE=Iceberg{engine_part}({storage_arg}, path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}) + {order_by} + {partition_by} + {settings_expression} + """ + ) else: raise Exception(f"Unknown iceberg storage type: {storage_type}") From c74753a5122af2f742bb463a7c3e1c81c24b4ee3 Mon Sep 17 00:00:00 2001 From: Vasily Nemkov Date: Wed, 12 Nov 2025 15:02:07 +0100 Subject: [PATCH 04/12] Merge pull request #1120 from Altinity/feature/antalya-25.8/iceberg_local_cluster icebergLocalCluster table function --- src/Databases/DataLake/DatabaseDataLake.cpp | 2 +- .../ObjectStorage/Local/Configuration.cpp | 17 +++++++++++ .../ObjectStorage/Local/Configuration.h | 2 ++ .../StorageObjectStorageCluster.cpp | 2 ++ .../registerStorageObjectStorage.cpp | 4 ++- .../TableFunctionObjectStorage.cpp | 19 ++---------- .../TableFunctionObjectStorageCluster.h | 1 + ...leFunctionObjectStorageClusterFallback.cpp | 29 +++++++++++++++++++ src/TableFunctions/registerTableFunctions.cpp | 1 - src/TableFunctions/registerTableFunctions.h | 1 - tests/integration/helpers/iceberg_utils.py | 2 +- .../test_cluster_table_function.py | 2 +- .../test_minmax_pruning_with_null.py | 1 + 13 files changed, 60 insertions(+), 23 deletions(-) diff --git a/src/Databases/DataLake/DatabaseDataLake.cpp b/src/Databases/DataLake/DatabaseDataLake.cpp index e96b5ff7d5ab..f93aa6a6bf4d 100644 --- a/src/Databases/DataLake/DatabaseDataLake.cpp +++ b/src/Databases/DataLake/DatabaseDataLake.cpp @@ -595,7 +595,7 @@ StoragePtr DatabaseDataLake::tryGetTableImpl(const String & name, ContextPtr con /* partition_by */nullptr, /* order_by */nullptr, context_copy, - /* comment */"", + /* comment */ "", getFormatSettings(context_copy), LoadingStrictnessLevel::CREATE, getCatalog(), diff --git a/src/Storages/ObjectStorage/Local/Configuration.cpp b/src/Storages/ObjectStorage/Local/Configuration.cpp index 2d88b97dfebf..1a8dc9c75551 100644 --- a/src/Storages/ObjectStorage/Local/Configuration.cpp +++ b/src/Storages/ObjectStorage/Local/Configuration.cpp @@ -126,4 +126,21 @@ void StorageLocalConfiguration::fromNamedCollection(const NamedCollection & coll initializeFromParsedArguments(parsed_arguments); paths = {path}; } + +ASTPtr StorageLocalConfiguration::createArgsWithAccessData() const +{ + auto arguments = make_intrusive(); + + arguments->children.push_back(make_intrusive(path.path)); + if (getFormat() != "auto") + arguments->children.push_back(make_intrusive(getFormat())); + if (getStructure() != "auto") + arguments->children.push_back(make_intrusive(getStructure())); + if (getCompressionMethod() != "auto") + arguments->children.push_back(make_intrusive(getCompressionMethod())); + + return arguments; +} + + } diff --git a/src/Storages/ObjectStorage/Local/Configuration.h b/src/Storages/ObjectStorage/Local/Configuration.h index bfed2088d8e8..c0a211f731ce 100644 --- a/src/Storages/ObjectStorage/Local/Configuration.h +++ b/src/Storages/ObjectStorage/Local/Configuration.h @@ -81,6 +81,8 @@ class StorageLocalConfiguration : public StorageObjectStorageConfiguration void addStructureAndFormatToArgsIfNeeded(ASTs &, const String &, const String &, ContextPtr, bool) override { } + ASTPtr createArgsWithAccessData() const override; + protected: void 
fromAST(ASTs & args, ContextPtr context, bool with_structure) override; void fromDisk(const String & disk_name_, ASTs & args, ContextPtr context, bool with_structure) override; diff --git a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp index aa063fb6c8d2..947072fd33d3 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp +++ b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp @@ -313,6 +313,7 @@ void StorageObjectStorageCluster::updateQueryForDistributedEngineIfNeeded(ASTPtr {"IcebergS3", "icebergS3"}, {"IcebergAzure", "icebergAzure"}, {"IcebergHDFS", "icebergHDFS"}, + {"IcebergLocal", "icebergLocal"}, {"DeltaLake", "deltaLake"}, {"DeltaLakeS3", "deltaLakeS3"}, {"DeltaLakeAzure", "deltaLakeAzure"}, @@ -428,6 +429,7 @@ void StorageObjectStorageCluster::updateQueryToSendIfNeeded( {"icebergS3", "icebergS3Cluster"}, {"icebergAzure", "icebergAzureCluster"}, {"icebergHDFS", "icebergHDFSCluster"}, + {"icebergLocal", "icebergLocalCluster"}, {"deltaLake", "deltaLakeCluster"}, {"deltaLakeS3", "deltaLakeS3Cluster"}, {"deltaLakeAzure", "deltaLakeAzureCluster"}, diff --git a/src/Storages/ObjectStorage/registerStorageObjectStorage.cpp b/src/Storages/ObjectStorage/registerStorageObjectStorage.cpp index 89c2d4e71485..22cb726963aa 100644 --- a/src/Storages/ObjectStorage/registerStorageObjectStorage.cpp +++ b/src/Storages/ObjectStorage/registerStorageObjectStorage.cpp @@ -104,7 +104,9 @@ createStorageObjectStorage(const StorageFactory::Arguments & args, StorageObject args.mode, configuration->getCatalog(context, args.query.attach), args.query.if_not_exists, - /* is_datalake_query*/ false); + /* is_datalake_query */ false, + /* is_table_function */ false, + /* lazy_init */ false); } #endif diff --git a/src/TableFunctions/TableFunctionObjectStorage.cpp b/src/TableFunctions/TableFunctionObjectStorage.cpp index 444ded628a1a..d400e963a5d9 100644 --- a/src/TableFunctions/TableFunctionObjectStorage.cpp +++ b/src/TableFunctions/TableFunctionObjectStorage.cpp @@ -274,10 +274,10 @@ StoragePtr TableFunctionObjectStorage:: /* comment */ String{}, /* format_settings */ std::nullopt, /// No format_settings /* mode */ LoadingStrictnessLevel::CREATE, - configuration->getCatalog(context, /*attach*/ false), + configuration->getCatalog(context, /* attach */ false), /* if_not_exists */ false, /* is_datalake_query*/ false, - /* is_table_function */true); + /* is_table_function */ true); storage->startup(); return storage; @@ -427,18 +427,6 @@ template class TableFunctionObjectStorage; #endif -#if USE_AVRO -void registerTableFunctionIceberg(TableFunctionFactory & factory) -{ - factory.registerFunction( - {.documentation - = {.description = R"(The table function can be used to read the Iceberg table stored locally.)", - .examples{{IcebergLocalDefinition::name, "SELECT * FROM icebergLocal(filename)", ""}}, - .category = FunctionDocumentation::Category::TableFunction}, - .allow_readonly = false}); -} -#endif - #if USE_AVRO void registerTableFunctionPaimon(TableFunctionFactory & factory) @@ -486,9 +474,6 @@ void registerTableFunctionPaimon(TableFunctionFactory & factory) void registerDataLakeTableFunctions(TableFunctionFactory & factory) { UNUSED(factory); -#if USE_AVRO - registerTableFunctionIceberg(factory); -#endif #if USE_AVRO registerTableFunctionPaimon(factory); diff --git a/src/TableFunctions/TableFunctionObjectStorageCluster.h b/src/TableFunctions/TableFunctionObjectStorageCluster.h index 483fe2636227..56500c9e2851 100644 --- 
a/src/TableFunctions/TableFunctionObjectStorageCluster.h +++ b/src/TableFunctions/TableFunctionObjectStorageCluster.h @@ -70,6 +70,7 @@ using TableFunctionHDFSCluster = TableFunctionObjectStorageCluster; +using TableFunctionIcebergLocalCluster = TableFunctionObjectStorageCluster; #endif #if USE_AVRO diff --git a/src/TableFunctions/TableFunctionObjectStorageClusterFallback.cpp b/src/TableFunctions/TableFunctionObjectStorageClusterFallback.cpp index 26c29fe7cff6..655bd9ac96a6 100644 --- a/src/TableFunctions/TableFunctionObjectStorageClusterFallback.cpp +++ b/src/TableFunctions/TableFunctionObjectStorageClusterFallback.cpp @@ -67,6 +67,13 @@ struct IcebergHDFSClusterFallbackDefinition static constexpr auto storage_engine_cluster_name = "IcebergHDFSCluster"; }; +struct IcebergLocalClusterFallbackDefinition +{ + static constexpr auto name = "icebergLocal"; + static constexpr auto storage_engine_name = "Local"; + static constexpr auto storage_engine_cluster_name = "IcebergLocalCluster"; +}; + struct DeltaLakeClusterFallbackDefinition { static constexpr auto name = "deltaLake"; @@ -163,6 +170,7 @@ using TableFunctionHDFSClusterFallback = TableFunctionObjectStorageClusterFallba #if USE_AVRO using TableFunctionIcebergClusterFallback = TableFunctionObjectStorageClusterFallback; +using TableFunctionIcebergLocalClusterFallback = TableFunctionObjectStorageClusterFallback; #endif #if USE_AVRO && USE_AWS_S3 @@ -286,6 +294,27 @@ void registerTableFunctionObjectStorageClusterFallback(TableFunctionFactory & fa .allow_readonly = false } ); + + factory.registerFunction( + { + .documentation = { + .description=R"(The table function can be used to read the Iceberg table stored on shared disk in parallel for many nodes in a specified cluster or from single node.)", + .examples{ + { + "icebergLocal", + "SELECT * FROM icebergLocal(filename)", "" + }, + { + "icebergLocal", + "SELECT * FROM icebergLocal(filename) " + "SETTINGS object_storage_cluster='cluster'", "" + }, + }, + .category = FunctionDocumentation::Category::TableFunction + }, + .allow_readonly = false + } + ); #endif #if USE_AVRO && USE_AWS_S3 diff --git a/src/TableFunctions/registerTableFunctions.cpp b/src/TableFunctions/registerTableFunctions.cpp index 77723732080d..7b0c751fc24c 100644 --- a/src/TableFunctions/registerTableFunctions.cpp +++ b/src/TableFunctions/registerTableFunctions.cpp @@ -70,7 +70,6 @@ void registerTableFunctions() registerTableFunctionObjectStorage(factory); registerTableFunctionObjectStorageCluster(factory); registerTableFunctionObjectStorageClusterFallback(factory); - registerDataLakeTableFunctions(factory); registerDataLakeClusterTableFunctions(factory); #if USE_YTSAURUS diff --git a/src/TableFunctions/registerTableFunctions.h b/src/TableFunctions/registerTableFunctions.h index 49a65507cf9d..01cee09e6e1e 100644 --- a/src/TableFunctions/registerTableFunctions.h +++ b/src/TableFunctions/registerTableFunctions.h @@ -71,7 +71,6 @@ void registerTableFunctionExplain(TableFunctionFactory & factory); void registerTableFunctionObjectStorage(TableFunctionFactory & factory); void registerTableFunctionObjectStorageCluster(TableFunctionFactory & factory); void registerTableFunctionObjectStorageClusterFallback(TableFunctionFactory & factory); -void registerDataLakeTableFunctions(TableFunctionFactory & factory); void registerDataLakeClusterTableFunctions(TableFunctionFactory & factory); void registerTableFunctionTimeSeries(TableFunctionFactory & factory); diff --git a/tests/integration/helpers/iceberg_utils.py 
b/tests/integration/helpers/iceberg_utils.py index 0849f628b0f9..9c5afb397626 100644 --- a/tests/integration/helpers/iceberg_utils.py +++ b/tests/integration/helpers/iceberg_utils.py @@ -305,7 +305,7 @@ def get_creation_expression( if run_on_cluster: assert table_function return f""" - iceberg{engine_part}({storage_arg}, path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}) + iceberg{engine_part}Cluster('cluster_simple', {storage_arg}, path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}) """ else: if table_function: diff --git a/tests/integration/test_storage_iceberg_with_spark/test_cluster_table_function.py b/tests/integration/test_storage_iceberg_with_spark/test_cluster_table_function.py index d964efe6ee69..8fcca49d2524 100644 --- a/tests/integration/test_storage_iceberg_with_spark/test_cluster_table_function.py +++ b/tests/integration/test_storage_iceberg_with_spark/test_cluster_table_function.py @@ -121,7 +121,7 @@ def make_query_from_function( storage_type_in_named_collection=storage_type_in_named_collection, ) query_id = str(uuid.uuid4()) - settings = "SETTINGS object_storage_cluster='cluster_simple'" if alt_syntax else "" + settings = f"SETTINGS object_storage_cluster='cluster_simple'" if (alt_syntax and not run_on_cluster) else "" if remote: query = f"SELECT * FROM remote('node2', {expr}) {settings}" else: diff --git a/tests/integration/test_storage_iceberg_with_spark/test_minmax_pruning_with_null.py b/tests/integration/test_storage_iceberg_with_spark/test_minmax_pruning_with_null.py index ceb630acbd73..217abdcd4b25 100644 --- a/tests/integration/test_storage_iceberg_with_spark/test_minmax_pruning_with_null.py +++ b/tests/integration/test_storage_iceberg_with_spark/test_minmax_pruning_with_null.py @@ -21,6 +21,7 @@ def execute_spark_query(query: str): storage_type, TABLE_NAME, query, + additional_nodes=["node2", "node3"] if storage_type=="local" else [], ) execute_spark_query( From c74de250994b4e81b3f362c9eaf5a26d67e71317 Mon Sep 17 00:00:00 2001 From: Anton Ivashkin Date: Tue, 10 Feb 2026 19:00:34 +0100 Subject: [PATCH 05/12] Fix metadata initialize --- src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp index 947072fd33d3..8947a95013ec 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp +++ b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp @@ -105,7 +105,7 @@ StorageObjectStorageCluster::StorageObjectStorageCluster( configuration->initPartitionStrategy(partition_by, columns_in_table_or_function_definition, context_); const bool need_resolve_columns_or_format = columns_in_table_or_function_definition.empty() || (configuration->getFormat() == "auto"); - const bool do_lazy_init = lazy_init && !need_resolve_columns_or_format; + const bool do_lazy_init = lazy_init && !need_resolve_columns_or_format && !configuration->needsUpdateForSchemaConsistency(); auto log_ = getLogger("StorageObjectStorageCluster"); From 79b334c31bc77a247e10750866b8a02eb571222a Mon Sep 17 00:00:00 2001 From: Anton Ivashkin Date: Tue, 10 Feb 2026 19:09:22 +0100 Subject: [PATCH 06/12] Fix delete and insert --- .../ObjectStorage/StorageObjectStorageCluster.cpp | 15 +++++++++++++++ .../ObjectStorage/StorageObjectStorageCluster.h | 4 ++++ 2 files changed, 19 insertions(+) diff --git 
a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp index 8947a95013ec..ae1895fbdd1f 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp +++ b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp @@ -888,4 +888,19 @@ void StorageObjectStorageCluster::onActionLockRemove(StorageActionBlockType acti IStorageCluster::onActionLockRemove(action_type); } +bool StorageObjectStorageCluster::supportsDelete() const +{ + if (pure_storage) + return pure_storage->supportsDelete(); + return IStorageCluster::supportsDelete(); +} + +bool StorageObjectStorageCluster::supportsParallelInsert() const +{ + if (pure_storage) + return pure_storage->supportsParallelInsert(); + return IStorageCluster::supportsParallelInsert(); +} + + } diff --git a/src/Storages/ObjectStorage/StorageObjectStorageCluster.h b/src/Storages/ObjectStorage/StorageObjectStorageCluster.h index 10ab3af0b69e..aaf8c714f04d 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageCluster.h +++ b/src/Storages/ObjectStorage/StorageObjectStorageCluster.h @@ -125,6 +125,10 @@ class StorageObjectStorageCluster : public IStorageCluster void updateExternalDynamicMetadataIfExists(ContextPtr query_context) override; + bool supportsDelete() const override; + + bool supportsParallelInsert() const override; + private: void updateQueryToSendIfNeeded( ASTPtr & query, From 5a7060fec29144a185cf697be4b939c0e2f96016 Mon Sep 17 00:00:00 2001 From: Anton Ivashkin Date: Wed, 11 Feb 2026 11:37:39 +0100 Subject: [PATCH 07/12] Fix metadata loading --- src/Storages/IStorageCluster.cpp | 2 ++ .../ObjectStorage/StorageObjectStorageCluster.cpp | 11 ++++------- 2 files changed, 6 insertions(+), 7 deletions(-) diff --git a/src/Storages/IStorageCluster.cpp b/src/Storages/IStorageCluster.cpp index b49f13435c0e..8166faceab30 100644 --- a/src/Storages/IStorageCluster.cpp +++ b/src/Storages/IStorageCluster.cpp @@ -121,6 +121,8 @@ void ReadFromCluster::createExtension(const ActionsDAG::Node * predicate) if (extension) return; + storage->updateExternalDynamicMetadataIfExists(context); + extension = storage->getTaskIteratorExtension( predicate, filter_actions_dag ? filter_actions_dag.get() : query_info.filter_actions_dag.get(), diff --git a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp index ae1895fbdd1f..9f342fe88621 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp +++ b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp @@ -120,9 +120,6 @@ StorageObjectStorageCluster::StorageObjectStorageCluster( { if (!do_lazy_init) { - /// We allow exceptions to be thrown on update(), - /// because Cluster engine can only be used as table function, - /// so no lazy initialization is allowed. configuration->update( object_storage, context_, @@ -182,7 +179,7 @@ StorageObjectStorageCluster::StorageObjectStorageCluster( /// This will update metadata which contains specific information about table state (e.g. 
for Iceberg) - if (configuration->needsUpdateForSchemaConsistency()) + if (!do_lazy_init && is_table_function && configuration->needsUpdateForSchemaConsistency()) { auto metadata_snapshot = configuration->getStorageSnapshotMetadata(context_); setInMemoryMetadata(metadata_snapshot); @@ -486,9 +483,6 @@ void StorageObjectStorageCluster::updateQueryToSendIfNeeded( void StorageObjectStorageCluster::updateExternalDynamicMetadataIfExists(ContextPtr query_context) { - if (getClusterName(query_context).empty()) - return pure_storage->updateExternalDynamicMetadataIfExists(query_context); - configuration->update( object_storage, query_context, @@ -498,6 +492,9 @@ void StorageObjectStorageCluster::updateExternalDynamicMetadataIfExists(ContextP auto metadata_snapshot = configuration->getStorageSnapshotMetadata(query_context); setInMemoryMetadata(metadata_snapshot); } + + if (pure_storage) + pure_storage->updateExternalDynamicMetadataIfExists(query_context); } RemoteQueryExecutor::Extension StorageObjectStorageCluster::getTaskIteratorExtension( From 5fe65fe5f882054373c84eb82b1c35e44ff122ba Mon Sep 17 00:00:00 2001 From: Vasily Nemkov Date: Mon, 13 Oct 2025 19:02:01 +0200 Subject: [PATCH 08/12] Merge pull request #1074 from Altinity/bugfix/antalya-25.8/prefer_large_blocks Fix prefersLargeBlocks for cluster storage --- src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp | 6 ++++++ src/Storages/ObjectStorage/StorageObjectStorageCluster.h | 2 ++ 2 files changed, 8 insertions(+) diff --git a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp index 9f342fe88621..ec249b93a391 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp +++ b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp @@ -899,5 +899,11 @@ bool StorageObjectStorageCluster::supportsParallelInsert() const return IStorageCluster::supportsParallelInsert(); } +bool StorageObjectStorageCluster::prefersLargeBlocks() const +{ + if (pure_storage) + return pure_storage->prefersLargeBlocks(); + return IStorageCluster::prefersLargeBlocks(); +} } diff --git a/src/Storages/ObjectStorage/StorageObjectStorageCluster.h b/src/Storages/ObjectStorage/StorageObjectStorageCluster.h index aaf8c714f04d..3f3ef4b9e4a6 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageCluster.h +++ b/src/Storages/ObjectStorage/StorageObjectStorageCluster.h @@ -129,6 +129,8 @@ class StorageObjectStorageCluster : public IStorageCluster bool supportsParallelInsert() const override; + bool prefersLargeBlocks() const override; + private: void updateQueryToSendIfNeeded( ASTPtr & query, From 5e18a1c2e49bc955a03acddbd5e284c72a90158a Mon Sep 17 00:00:00 2001 From: Anton Ivashkin Date: Thu, 13 Nov 2025 11:25:27 +0100 Subject: [PATCH 09/12] More virtual methods for StorageObjectStorageCluster --- src/Storages/IStorage.h | 2 +- .../StorageObjectStorageCluster.cpp | 63 +++++++++++++++++++ .../StorageObjectStorageCluster.h | 16 +++++ 3 files changed, 80 insertions(+), 1 deletion(-) diff --git a/src/Storages/IStorage.h b/src/Storages/IStorage.h index 7179dbbfa8ee..d297a284855c 100644 --- a/src/Storages/IStorage.h +++ b/src/Storages/IStorage.h @@ -435,6 +435,7 @@ class IStorage : public std::enable_shared_from_this, public TypePromo size_t /*max_block_size*/, size_t /*num_streams*/); +public: /// Should we process blocks of data returned by the storage in parallel /// even when the storage returned only one stream of data for reading? 
/// It is beneficial, for example, when you read from a file quickly, @@ -445,7 +446,6 @@ class IStorage : public std::enable_shared_from_this, public TypePromo /// useless). virtual bool parallelizeOutputAfterReading(ContextPtr) const { return !isSystemStorage(); } -public: /// Other version of read which adds reading step to query plan. /// Default implementation creates ReadFromStorageStep and uses usual read. /// Can be called after `shutdown`, but not after `drop`. diff --git a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp index ec249b93a391..9a44b2959314 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp +++ b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp @@ -906,4 +906,67 @@ bool StorageObjectStorageCluster::prefersLargeBlocks() const return IStorageCluster::prefersLargeBlocks(); } +bool StorageObjectStorageCluster::supportsPartitionBy() const +{ + if (pure_storage) + return pure_storage->supportsPartitionBy(); + return IStorageCluster::supportsPartitionBy(); +} + +bool StorageObjectStorageCluster::supportsSubcolumns() const +{ + if (pure_storage) + return pure_storage->supportsSubcolumns(); + return IStorageCluster::supportsSubcolumns(); +} + +bool StorageObjectStorageCluster::supportsDynamicSubcolumns() const +{ + if (pure_storage) + return pure_storage->supportsDynamicSubcolumns(); + return IStorageCluster::supportsDynamicSubcolumns(); +} + +bool StorageObjectStorageCluster::supportsTrivialCountOptimization(const StorageSnapshotPtr & snapshot, ContextPtr context) const +{ + if (pure_storage) + return pure_storage->supportsTrivialCountOptimization(snapshot, context); + return IStorageCluster::supportsTrivialCountOptimization(snapshot, context); +} + +bool StorageObjectStorageCluster::supportsPrewhere() const +{ + if (pure_storage) + return pure_storage->supportsPrewhere(); + return IStorageCluster::supportsPrewhere(); +} + +bool StorageObjectStorageCluster::canMoveConditionsToPrewhere() const +{ + if (pure_storage) + return pure_storage->canMoveConditionsToPrewhere(); + return IStorageCluster::canMoveConditionsToPrewhere(); +} + +std::optional StorageObjectStorageCluster::supportedPrewhereColumns() const +{ + if (pure_storage) + return pure_storage->supportedPrewhereColumns(); + return IStorageCluster::supportedPrewhereColumns(); +} + +IStorageCluster::ColumnSizeByName StorageObjectStorageCluster::getColumnSizes() const +{ + if (pure_storage) + return pure_storage->getColumnSizes(); + return IStorageCluster::getColumnSizes(); +} + +bool StorageObjectStorageCluster::parallelizeOutputAfterReading(ContextPtr context) const +{ + if (pure_storage) + return pure_storage->parallelizeOutputAfterReading(context); + return IStorageCluster::parallelizeOutputAfterReading(context); +} + } diff --git a/src/Storages/ObjectStorage/StorageObjectStorageCluster.h b/src/Storages/ObjectStorage/StorageObjectStorageCluster.h index 3f3ef4b9e4a6..057902257482 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageCluster.h +++ b/src/Storages/ObjectStorage/StorageObjectStorageCluster.h @@ -131,6 +131,22 @@ class StorageObjectStorageCluster : public IStorageCluster bool prefersLargeBlocks() const override; + bool supportsPartitionBy() const override; + + bool supportsSubcolumns() const override; + + bool supportsDynamicSubcolumns() const override; + + bool supportsTrivialCountOptimization(const StorageSnapshotPtr &, ContextPtr) const override; + + /// Things required for PREWHERE. 
+ bool supportsPrewhere() const override; + bool canMoveConditionsToPrewhere() const override; + std::optional supportedPrewhereColumns() const override; + ColumnSizeByName getColumnSizes() const override; + + bool parallelizeOutputAfterReading(ContextPtr context) const override; + private: void updateQueryToSendIfNeeded( ASTPtr & query, From fb0febdf20b03b9bb75f148b0b4db6c578fb3a6f Mon Sep 17 00:00:00 2001 From: Anton Ivashkin Date: Wed, 11 Feb 2026 12:54:05 +0100 Subject: [PATCH 10/12] Fix mask sensitive info test --- .../test_mask_sensitive_info/test.py | 54 ++++++------------- 1 file changed, 15 insertions(+), 39 deletions(-) diff --git a/tests/integration/test_mask_sensitive_info/test.py b/tests/integration/test_mask_sensitive_info/test.py index b2fd3234d851..a6313d159643 100644 --- a/tests/integration/test_mask_sensitive_info/test.py +++ b/tests/integration/test_mask_sensitive_info/test.py @@ -301,38 +301,14 @@ def test_create_table(): f"AzureBlobStorage('{azure_storage_account_url}', 'cont', 'test_simple_3.csv', '{azure_account_name}', '{azure_account_key}')", f"AzureBlobStorage('{azure_storage_account_url}', 'cont', 'test_simple_4.csv', '{azure_account_name}', '{azure_account_key}', 'CSV')", f"AzureBlobStorage('{azure_storage_account_url}', 'cont', 'test_simple_5.csv', '{azure_account_name}', '{azure_account_key}', 'CSV', 'none')", - ( - f"IcebergAzure('{azure_conn_string}', 'cont', 'test_simple.csv')", - "FILE_DOESNT_EXIST", - ), - ( - f"IcebergAzure('{azure_storage_account_url}', 'cont', 'test_simple.csv', '{azure_account_name}', '{azure_account_key}')", - "FILE_DOESNT_EXIST", - ), - ( - f"IcebergAzure(named_collection_2, connection_string = '{azure_conn_string}', container = 'cont', blob_path = 'test_simple_7.csv', format = 'CSV')", - "FILE_DOESNT_EXIST", - ), - ( - f"IcebergAzure(named_collection_2, storage_account_url = '{azure_storage_account_url}', container = 'cont', blob_path = 'test_simple_8.csv', account_name = '{azure_account_name}', account_key = '{azure_account_key}')", - "FILE_DOESNT_EXIST", - ), - ( - f"Iceberg(storage_type='azure', '{azure_conn_string}', 'cont', 'test_simple.csv')", - "FILE_DOESNT_EXIST", - ), - ( - f"Iceberg(storage_type='azure', '{azure_storage_account_url}', 'cont', 'test_simple.csv', '{azure_account_name}', '{azure_account_key}')", - "FILE_DOESNT_EXIST", - ), - ( - f"Iceberg(storage_type='azure', named_collection_2, connection_string = '{azure_conn_string}', container = 'cont', blob_path = 'test_simple_7.csv', format = 'CSV')", - "FILE_DOESNT_EXIST", - ), - ( - f"Iceberg(storage_type='azure', named_collection_2, storage_account_url = '{azure_storage_account_url}', container = 'cont', blob_path = 'test_simple_8.csv', account_name = '{azure_account_name}', account_key = '{azure_account_key}')", - "FILE_DOESNT_EXIST", - ), + f"IcebergAzure('{azure_conn_string}', 'cont', 'test_simple.csv')", + f"IcebergAzure('{azure_storage_account_url}', 'cont', 'test_simple_1.csv', '{azure_account_name}', '{azure_account_key}')", + f"IcebergAzure(named_collection_2, connection_string = '{azure_conn_string}', container = 'cont', blob_path = 'test_simple_2.csv', format = 'CSV')", + f"IcebergAzure(named_collection_2, storage_account_url = '{azure_storage_account_url}', container = 'cont', blob_path = 'test_simple_3.csv', account_name = '{azure_account_name}', account_key = '{azure_account_key}')", + f"Iceberg(storage_type='azure', '{azure_conn_string}', 'cont', 'test_simple_4.csv')", + f"Iceberg(storage_type='azure', '{azure_storage_account_url}', 'cont', 
'test_simple_5.csv', '{azure_account_name}', '{azure_account_key}')", + f"Iceberg(storage_type='azure', named_collection_2, connection_string = '{azure_conn_string}', container = 'cont', blob_path = 'test_simple_6.csv', format = 'CSV')", + f"Iceberg(storage_type='azure', named_collection_2, storage_account_url = '{azure_storage_account_url}', container = 'cont', blob_path = 'test_simple_7.csv', account_name = '{azure_account_name}', account_key = '{azure_account_key}')", f"Kafka() SETTINGS kafka_broker_list = '127.0.0.1', kafka_topic_list = 'topic', kafka_group_name = 'group', kafka_format = 'JSONEachRow', kafka_security_protocol = 'sasl_ssl', kafka_sasl_mechanism = 'PLAIN', kafka_sasl_username = 'user', kafka_sasl_password = '{password}', format_avro_schema_registry_url = 'http://schema_user:{password}@'", f"Kafka() SETTINGS kafka_broker_list = '127.0.0.1', kafka_topic_list = 'topic', kafka_group_name = 'group', kafka_format = 'JSONEachRow', kafka_security_protocol = 'sasl_ssl', kafka_sasl_mechanism = 'PLAIN', kafka_sasl_username = 'user', kafka_sasl_password = '{password}', format_avro_schema_registry_url = 'http://schema_user:{password}@domain.com'", @@ -431,13 +407,13 @@ def generate_create_table_numbered(tail): generate_create_table_numbered(f"(`x` int) ENGINE = AzureBlobStorage('{azure_storage_account_url}', 'cont', 'test_simple_4.csv', '{azure_account_name}', '[HIDDEN]', 'CSV')"), generate_create_table_numbered(f"(`x` int) ENGINE = AzureBlobStorage('{azure_storage_account_url}', 'cont', 'test_simple_5.csv', '{azure_account_name}', '[HIDDEN]', 'CSV', 'none')"), generate_create_table_numbered(f"(`x` int) ENGINE = IcebergAzure('{masked_azure_conn_string}', 'cont', 'test_simple.csv')"), - generate_create_table_numbered(f"(`x` int) ENGINE = IcebergAzure('{azure_storage_account_url}', 'cont', 'test_simple.csv', '{azure_account_name}', '[HIDDEN]')"), - generate_create_table_numbered(f"(`x` int) ENGINE = IcebergAzure(named_collection_2, connection_string = '{masked_azure_conn_string}', container = 'cont', blob_path = 'test_simple_7.csv', format = 'CSV')"), - generate_create_table_numbered(f"(`x` int) ENGINE = IcebergAzure(named_collection_2, storage_account_url = '{azure_storage_account_url}', container = 'cont', blob_path = 'test_simple_8.csv', account_name = '{azure_account_name}', account_key = '[HIDDEN]')"), - generate_create_table_numbered(f"(`x` int) ENGINE = Iceberg(storage_type = 'azure', '{masked_azure_conn_string}', 'cont', 'test_simple.csv')"), - generate_create_table_numbered(f"(`x` int) ENGINE = Iceberg(storage_type = 'azure', '{azure_storage_account_url}', 'cont', 'test_simple.csv', '{azure_account_name}', '[HIDDEN]')"), - generate_create_table_numbered(f"(`x` int) ENGINE = Iceberg(storage_type = 'azure', named_collection_2, connection_string = '{masked_azure_conn_string}', container = 'cont', blob_path = 'test_simple_7.csv', format = 'CSV')"), - generate_create_table_numbered(f"(`x` int) ENGINE = Iceberg(storage_type = 'azure', named_collection_2, storage_account_url = '{azure_storage_account_url}', container = 'cont', blob_path = 'test_simple_8.csv', account_name = '{azure_account_name}', account_key = '[HIDDEN]')"), + generate_create_table_numbered(f"(`x` int) ENGINE = IcebergAzure('{azure_storage_account_url}', 'cont', 'test_simple_1.csv', '{azure_account_name}', '[HIDDEN]')"), + generate_create_table_numbered(f"(`x` int) ENGINE = IcebergAzure(named_collection_2, connection_string = '{masked_azure_conn_string}', container = 'cont', blob_path = 'test_simple_2.csv', format = 
'CSV')"), + generate_create_table_numbered(f"(`x` int) ENGINE = IcebergAzure(named_collection_2, storage_account_url = '{azure_storage_account_url}', container = 'cont', blob_path = 'test_simple_3.csv', account_name = '{azure_account_name}', account_key = '[HIDDEN]')"), + generate_create_table_numbered(f"(`x` int) ENGINE = Iceberg(storage_type = 'azure', '{masked_azure_conn_string}', 'cont', 'test_simple_4.csv')"), + generate_create_table_numbered(f"(`x` int) ENGINE = Iceberg(storage_type = 'azure', '{azure_storage_account_url}', 'cont', 'test_simple_5.csv', '{azure_account_name}', '[HIDDEN]')"), + generate_create_table_numbered(f"(`x` int) ENGINE = Iceberg(storage_type = 'azure', named_collection_2, connection_string = '{masked_azure_conn_string}', container = 'cont', blob_path = 'test_simple_6.csv', format = 'CSV')"), + generate_create_table_numbered(f"(`x` int) ENGINE = Iceberg(storage_type = 'azure', named_collection_2, storage_account_url = '{azure_storage_account_url}', container = 'cont', blob_path = 'test_simple_7.csv', account_name = '{azure_account_name}', account_key = '[HIDDEN]')"), generate_create_table_numbered("(`x` int) ENGINE = Kafka SETTINGS kafka_broker_list = '127.0.0.1', kafka_topic_list = 'topic', kafka_group_name = 'group', kafka_format = 'JSONEachRow', kafka_security_protocol = 'sasl_ssl', kafka_sasl_mechanism = 'PLAIN', kafka_sasl_username = 'user', kafka_sasl_password = '[HIDDEN]', format_avro_schema_registry_url = 'http://schema_user:[HIDDEN]@'"), generate_create_table_numbered("(`x` int) ENGINE = Kafka SETTINGS kafka_broker_list = '127.0.0.1', kafka_topic_list = 'topic', kafka_group_name = 'group', kafka_format = 'JSONEachRow', kafka_security_protocol = 'sasl_ssl', kafka_sasl_mechanism = 'PLAIN', kafka_sasl_username = 'user', kafka_sasl_password = '[HIDDEN]', format_avro_schema_registry_url = 'http://schema_user:[HIDDEN]@domain.com'"), generate_create_table_numbered("(`x` int) ENGINE = S3('http://minio1:9001/root/data/test5.csv.gz', 'CSV', access_key_id = 'minio', secret_access_key = '[HIDDEN]', compression_method = 'gzip')"), From c39c2015f2a6c8cde87f859dfe32e4eb4229255e Mon Sep 17 00:00:00 2001 From: Anton Ivashkin Date: Wed, 17 Dec 2025 15:18:40 +0100 Subject: [PATCH 11/12] Fix confusing cluster name and named collection name in cluster functions --- .../ObjectStorage/StorageObjectStorageCluster.cpp | 10 +++++++++- tests/integration/helpers/iceberg_utils.py | 9 ++++++--- .../test_cluster_table_function.py | 6 ++++-- 3 files changed, 19 insertions(+), 6 deletions(-) diff --git a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp index 9a44b2959314..e008df1560da 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp +++ b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp @@ -399,7 +399,15 @@ void StorageObjectStorageCluster::updateQueryToSendIfNeeded( } ASTPtr object_storage_type_arg; - configuration->extractDynamicStorageType(args, context, &object_storage_type_arg); + if (cluster_name_in_settings) + configuration->extractDynamicStorageType(args, context, &object_storage_type_arg); + else + { + auto args_copy = args; + // Remove cluster name from args to avoid confusing cluster name and named collection name + args_copy.erase(args_copy.begin()); + configuration->extractDynamicStorageType(args_copy, context, &object_storage_type_arg); + } ASTPtr settings_temporary_storage = nullptr; for (auto it = args.begin(); it != args.end(); ++it) { diff --git 
a/tests/integration/helpers/iceberg_utils.py b/tests/integration/helpers/iceberg_utils.py index 9c5afb397626..d6a87b84b31e 100644 --- a/tests/integration/helpers/iceberg_utils.py +++ b/tests/integration/helpers/iceberg_utils.py @@ -205,6 +205,7 @@ def get_creation_expression( additional_settings = [], storage_type_as_arg=False, storage_type_in_named_collection=False, + cluster_name_as_literal=True, **kwargs, ): settings_array = list(additional_settings) @@ -234,6 +235,8 @@ def get_creation_expression( else: settings_expression = "" + cluster_name = "'cluster_simple'" if cluster_name_as_literal else "cluster_simple" + storage_arg = storage_type engine_part = "" if (storage_type_in_named_collection): @@ -262,7 +265,7 @@ def get_creation_expression( if run_on_cluster: assert table_function - return f"iceberg{engine_part}Cluster('cluster_simple', {storage_arg}, filename = 'var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}, url = 'http://minio1:9001/{bucket}/')" + return f"iceberg{engine_part}Cluster({cluster_name}, {storage_arg}, filename = 'var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}, url = 'http://minio1:9001/{bucket}/')" else: if table_function: return f"iceberg{engine_part}({storage_arg}, filename = 'var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}, url = 'http://minio1:9001/{bucket}/')" @@ -282,7 +285,7 @@ def get_creation_expression( if run_on_cluster: assert table_function return f""" - iceberg{engine_part}Cluster('cluster_simple', {storage_arg}, container = '{cluster.azure_container_name}', storage_account_url = '{cluster.env_variables["AZURITE_STORAGE_ACCOUNT_URL"]}', blob_path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}) + iceberg{engine_part}Cluster({cluster_name}, {storage_arg}, container = '{cluster.azure_container_name}', storage_account_url = '{cluster.env_variables["AZURITE_STORAGE_ACCOUNT_URL"]}', blob_path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}) """ else: if table_function: @@ -305,7 +308,7 @@ def get_creation_expression( if run_on_cluster: assert table_function return f""" - iceberg{engine_part}Cluster('cluster_simple', {storage_arg}, path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}) + iceberg{engine_part}Cluster({cluster_name}, {storage_arg}, path = '/var/lib/clickhouse/user_files/iceberg_data/default/{table_name}/', format={format}) """ else: if table_function: diff --git a/tests/integration/test_storage_iceberg_with_spark/test_cluster_table_function.py b/tests/integration/test_storage_iceberg_with_spark/test_cluster_table_function.py index 8fcca49d2524..9b847b679a4c 100644 --- a/tests/integration/test_storage_iceberg_with_spark/test_cluster_table_function.py +++ b/tests/integration/test_storage_iceberg_with_spark/test_cluster_table_function.py @@ -40,7 +40,8 @@ def count_secondary_subqueries(started_cluster, query_id, expected, comment): @pytest.mark.parametrize("format_version", ["1", "2"]) @pytest.mark.parametrize("storage_type", ["s3", "azure", "local"]) -def test_cluster_table_function(started_cluster_iceberg_with_spark, format_version, storage_type): +@pytest.mark.parametrize("cluster_name_as_literal", [True, False]) +def test_cluster_table_function(started_cluster_iceberg_with_spark, format_version, storage_type, cluster_name_as_literal): instance = started_cluster_iceberg_with_spark.instances["node1"] spark = 
started_cluster_iceberg_with_spark.spark_session @@ -98,7 +99,7 @@ def add_df(mode): # Regular Query only node1 table_function_expr = get_creation_expression( - storage_type, TABLE_NAME, started_cluster_iceberg_with_spark, table_function=True + storage_type, TABLE_NAME, started_cluster_iceberg_with_spark, table_function=True, cluster_name_as_literal=cluster_name_as_literal ) select_regular = ( instance.query(f"SELECT * FROM {table_function_expr}").strip().split() @@ -119,6 +120,7 @@ def make_query_from_function( run_on_cluster=run_on_cluster, storage_type_as_arg=storage_type_as_arg, storage_type_in_named_collection=storage_type_in_named_collection, + cluster_name_as_literal=cluster_name_as_literal, ) query_id = str(uuid.uuid4()) settings = f"SETTINGS object_storage_cluster='cluster_simple'" if (alt_syntax and not run_on_cluster) else "" From c9c0cbc43a524bf3d12064c63650118866ca5e1a Mon Sep 17 00:00:00 2001 From: Anton Ivashkin Date: Thu, 12 Feb 2026 11:14:24 +0100 Subject: [PATCH 12/12] Fix paimon functions --- .../StorageObjectStorageCluster.cpp | 1 + .../TableFunctionObjectStorage.cpp | 16 ++++++++++++++++ src/TableFunctions/registerTableFunctions.cpp | 1 + src/TableFunctions/registerTableFunctions.h | 1 + 4 files changed, 19 insertions(+) diff --git a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp index e008df1560da..d11cec0a7889 100644 --- a/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp +++ b/src/Storages/ObjectStorage/StorageObjectStorageCluster.cpp @@ -314,6 +314,7 @@ void StorageObjectStorageCluster::updateQueryForDistributedEngineIfNeeded(ASTPtr {"DeltaLake", "deltaLake"}, {"DeltaLakeS3", "deltaLakeS3"}, {"DeltaLakeAzure", "deltaLakeAzure"}, + {"DeltaLakeLocal", "deltaLakeLocal"}, {"Hudi", "hudi"} }; diff --git a/src/TableFunctions/TableFunctionObjectStorage.cpp b/src/TableFunctions/TableFunctionObjectStorage.cpp index d400e963a5d9..6efd6edc4dfd 100644 --- a/src/TableFunctions/TableFunctionObjectStorage.cpp +++ b/src/TableFunctions/TableFunctionObjectStorage.cpp @@ -471,10 +471,26 @@ void registerTableFunctionPaimon(TableFunctionFactory & factory) } #endif +#if USE_PARQUET && USE_DELTA_KERNEL_RS +void registerTableFunctionDeltaLake(TableFunctionFactory & factory) +{ + // Register the new local Delta Lake table function + factory.registerFunction( + {.documentation + = {.description = R"(The table function can be used to read the DeltaLake table stored locally.)", + .examples{{DeltaLakeLocalDefinition::name, "SELECT * FROM deltaLakeLocal(path)", ""}}, + .category = FunctionDocumentation::Category::TableFunction}, + .allow_readonly = false}); +} +#endif + void registerDataLakeTableFunctions(TableFunctionFactory & factory) { UNUSED(factory); +#if USE_PARQUET && USE_DELTA_KERNEL_RS + registerTableFunctionDeltaLake(factory); +#endif #if USE_AVRO registerTableFunctionPaimon(factory); #endif diff --git a/src/TableFunctions/registerTableFunctions.cpp b/src/TableFunctions/registerTableFunctions.cpp index 7b0c751fc24c..f666a04fca35 100644 --- a/src/TableFunctions/registerTableFunctions.cpp +++ b/src/TableFunctions/registerTableFunctions.cpp @@ -69,6 +69,7 @@ void registerTableFunctions() registerTableFunctionObjectStorage(factory); registerTableFunctionObjectStorageCluster(factory); + registerDataLakeTableFunctions(factory); registerTableFunctionObjectStorageClusterFallback(factory); registerDataLakeClusterTableFunctions(factory); diff --git a/src/TableFunctions/registerTableFunctions.h 
b/src/TableFunctions/registerTableFunctions.h index 01cee09e6e1e..c04f7de19881 100644 --- a/src/TableFunctions/registerTableFunctions.h +++ b/src/TableFunctions/registerTableFunctions.h @@ -70,6 +70,7 @@ void registerTableFunctionExplain(TableFunctionFactory & factory); void registerTableFunctionObjectStorage(TableFunctionFactory & factory); void registerTableFunctionObjectStorageCluster(TableFunctionFactory & factory); +void registerDataLakeTableFunctions(TableFunctionFactory & factory); void registerTableFunctionObjectStorageClusterFallback(TableFunctionFactory & factory); void registerDataLakeClusterTableFunctions(TableFunctionFactory & factory);
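
A quick usage sketch of what this series enables, assembled from the registration examples and integration tests above. It is illustrative only: the cluster name cluster_simple and the blob/file paths are taken from the test fixtures, while the named collection s3_conn and the <azure connection string> value are hypothetical placeholders, not identifiers defined by these patches.

    -- 1. Classic syntax: the cluster is the first argument of the *Cluster function;
    --    PATCH 11/12 accepts it both as an identifier and as a string literal without
    --    mistaking it for a named collection.
    SELECT count()
    FROM icebergS3Cluster(cluster_simple, s3_conn,
                          filename = 'iceberg_data/default/test_table/', format = 'Parquet');

    -- 2. Alternative syntax: keep the single-node function and fan it out over the
    --    cluster with the object_storage_cluster setting (handled by the fallback
    --    functions in TableFunctionObjectStorageClusterFallback.cpp).
    SELECT count()
    FROM icebergS3(s3_conn, filename = 'iceberg_data/default/test_table/', format = 'Parquet')
    SETTINGS object_storage_cluster = 'cluster_simple';

    -- 3. The same setting applies to the locally stored lakes wired up here
    --    (icebergLocal/icebergLocalCluster in PATCH 04/12, deltaLakeLocal in PATCH 12/12).
    SELECT *
    FROM icebergLocal('/var/lib/clickhouse/user_files/iceberg_data/default/test_table/')
    SETTINGS object_storage_cluster = 'cluster_simple';

    -- 4. Dynamic storage type: a single Iceberg engine name plus an explicit
    --    storage_type argument, as exercised by the mask-sensitive-info test in PATCH 10/12.
    CREATE TABLE iceberg_azure_tbl (x Int32)
    ENGINE = Iceberg(storage_type = 'azure', named_collection_2,
                     connection_string = '<azure connection string>', container = 'cont',
                     blob_path = 'test_simple_6.csv', format = 'CSV');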