DDLWorker.cpp 23.3 KB
Newer Older
1
#include <Interpreters/DDLWorker.h>
2 3

#include <Parsers/ASTAlterQuery.h>
4
#include <Parsers/ASTQueryWithOnCluster.h>
5 6 7
#include <Parsers/ParserQuery.h>
#include <Parsers/parseQuery.h>
#include <Parsers/queryToString.h>
8

9 10 11 12 13
#include <IO/WriteHelpers.h>
#include <IO/ReadHelpers.h>
#include <IO/Operators.h>
#include <IO/ReadBufferFromString.h>

14
#include <Storages/IStorage.h>
15
#include <DataStreams/OneBlockInputStream.h>
16

17
#include <Interpreters/executeQuery.h>
18
#include <Interpreters/Cluster.h>
19

20
#include <Common/getFQDNOrHostName.h>
21 22
#include <Common/setThreadName.h>
#include <Common/Stopwatch.h>
23 24 25 26 27 28 29

#include <DataTypes/DataTypesNumber.h>
#include <DataTypes/DataTypeString.h>
#include <DataTypes/DataTypeArray.h>
#include <Columns/ColumnsNumber.h>
#include <Columns/ColumnString.h>
#include <Columns/ColumnArray.h>
30

31 32
#include <Common/ZooKeeper/ZooKeeper.h>
#include <Common/ZooKeeper/Lock.h>
33 34
#include <Poco/Timestamp.h>

35 36
#include <experimental/optional>

37 38 39 40 41 42 43 44

namespace DB
{

/// Error codes used in this translation unit.
namespace ErrorCodes
{
    extern const int UNKNOWN_ELEMENT_IN_CONFIG;
    extern const int INVALID_CONFIG_PARAMETER;
    extern const int UNKNOWN_FORMAT_VERSION;
    extern const int INCONSISTENT_TABLE_ACCROSS_SHARDS;
    extern const int INCONSISTENT_CLUSTER_DEFINITION;
    extern const int TIMEOUT_EXCEEDED;
    extern const int UNFINISHED;
    /// Both codes below are referenced by this file; declare them here
    /// instead of depending on a declaration leaking in from some header.
    extern const int NOT_IMPLEMENTED;
    extern const int LOGICAL_ERROR;
}


53 54 55 56
/// Queue nodes whose modification time is older than this (one week) are removed by cleanupQueue().
const size_t DDLWorker::node_max_lifetime_seconds = 7 * 24 * 60 * 60;
/// cleanupQueue() does nothing if the previous cleanup happened less than this (one minute) ago.
const size_t DDLWorker::cleanup_min_period_seconds = 60;


57 58 59 60
struct DDLLogEntry
{
    String query;
    Strings hosts;
61
    String initiator; // optional
62

63
    static constexpr int CURRENT_VERSION = 1;
64 65 66

    String toString()
    {
67 68 69 70 71 72 73 74 75
        WriteBufferFromOwnString wb;

        auto version = CURRENT_VERSION;
        wb << "version: " << version << "\n";
        wb << "query: " << escape << query << "\n";
        wb << "hosts: " << hosts << "\n";
        wb << "initiator: " << initiator << "\n";

        return wb.str();
76 77 78 79 80 81
    }

    void parse(const String & data)
    {
        ReadBufferFromString rb(data);

82 83 84
        int version;
        rb >> "version: " >> version >> "\n";

85
        if (version != CURRENT_VERSION)
86
            throw Exception("Unknown DDLLogEntry format version: " + DB::toString(version), ErrorCodes::UNKNOWN_FORMAT_VERSION);
87

88
        rb >> "query: " >> escape >> query >> "\n";
89
        rb >> "hosts: " >> hosts >> "\n";
90 91 92 93 94

        if (!rb.eof())
            rb >> "initiator: " >> initiator >> "\n";
        else
            initiator.clear();
95 96 97 98

        assertEOF(rb);
    }
};
99 100


101 102
using ShardAndHostNum = std::experimental::optional<std::pair<size_t, size_t>>;

/// Looks for the address with the given host name and port among all shards of the cluster.
/// Returns zero-based (shard index, index inside the shard) of the first match, or an empty optional.
static ShardAndHostNum tryGetShardAndHostNum(const Cluster::AddressesWithFailover & cluster, const String & host_name, UInt16 port)
{
    size_t shard_index = 0;
    for (const auto & shard_addresses : cluster)
    {
        size_t address_index = 0;
        for (const auto & candidate : shard_addresses)
        {
            if (candidate.host_name == host_name && candidate.port == port)
                return std::make_pair(shard_index, address_index);

            ++address_index;
        }

        ++shard_index;
    }

    return {};
}


/// Tells whether an ALTER command of the given type belongs to the fixed set
/// of types accepted for distributed DDL execution.
static bool isSupportedAlterType(int type)
{
    static const std::unordered_set<int> allowed_types{
        ASTAlterQuery::ADD_COLUMN,
        ASTAlterQuery::DROP_COLUMN,
        ASTAlterQuery::MODIFY_COLUMN,
        ASTAlterQuery::MODIFY_PRIMARY_KEY,
        ASTAlterQuery::DROP_PARTITION
    };

    return allowed_types.find(type) != allowed_types.end();
}


132
/// Remembers the ZooKeeper queue directory and the identity of this host,
/// then starts the background thread that executes run().
///   zk_root_dir - path of the queue directory; one trailing '/' is stripped.
///   context_    - server context; a reference to it is kept.
DDLWorker::DDLWorker(const std::string & zk_root_dir, Context & context_)
    : context(context_)
{
    queue_dir = zk_root_dir;
    /// back() must not be called on an empty string, so check emptiness first.
    if (!queue_dir.empty() && queue_dir.back() == '/')
        queue_dir.pop_back();

    host_name = getFQDNOrHostName();
    port = context.getTCPPort();
    /// Textual "host + port" identifier; it is used as a node name under a task's status directories.
    host_id = Cluster::Address::toString(host_name, port);

    event_queue_updated = std::make_shared<Poco::Event>();

    /// Started last, after everything assigned above is in place.
    thread = std::thread(&DDLWorker::run, this);
}

148

149 150 151
/// Asks the background thread to stop and waits until it exits.
DDLWorker::~DDLWorker()
{
    /// The flag is raised before the event is signalled: run() checks it right after waking up.
    stop_flag = true;

    /// Wake run() up if it is blocked waiting for queue updates.
    event_queue_updated->set();

    thread.join();
}

156

157 158
void DDLWorker::processTasks()
{
159
    LOG_DEBUG(log, "Processing tasks");
160

161
    Strings queue_nodes = zookeeper->getChildren(queue_dir, nullptr, event_queue_updated);
162
    if (queue_nodes.empty())
163 164
        return;

165
    bool server_startup = last_processed_node_name.empty();
166

167 168 169 170
    std::sort(queue_nodes.begin(), queue_nodes.end());
    auto begin_node = server_startup
        ? queue_nodes.begin()
        : std::upper_bound(queue_nodes.begin(), queue_nodes.end(), last_processed_node_name);
171

172
    for (auto it = begin_node; it != queue_nodes.end(); ++it)
173
    {
174 175 176
        const String & node_name = *it;
        String node_path = queue_dir + "/" + node_name;
        String node_data;
177

178 179 180 181 182
        if (!zookeeper->tryGet(node_path, node_data))
        {
            /// It is Ok that node could be deleted just now. It means that there are no current host in node's host list.
            continue;
        }
183 184 185 186

        DDLLogEntry node;
        node.parse(node_data);

187
        bool host_in_hostlist = std::find(node.hosts.cbegin(), node.hosts.cend(), host_id) != node.hosts.cend();
188
        bool already_processed = zookeeper->exists(node_path + "/finished/" + host_id);
189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204

        if (!server_startup && already_processed)
        {
            throw Exception(
                "Server expects that DDL node " + node_name + " should be processed, but it was already processed according to ZK",
                ErrorCodes::LOGICAL_ERROR);
        }

        if (host_in_hostlist && !already_processed)
        {
            try
            {
                processTask(node, node_name);
            }
            catch (...)
            {
205
                tryLogCurrentException(log, "An error occurred while processing node " + node_name + " (" + node.query + ")");
206 207 208
                throw;
            }
        }
209 210 211 212
        else
        {
            LOG_DEBUG(log, "Node " << node_name << " (" << node.query << ") will not be processed");
        }
213 214

        last_processed_node_name = node_name;
215
    }
216 217
}

218

219
static bool tryExecuteQuery(const String & query, Context & context, ExecutionStatus & status, Logger * log = nullptr)
220 221 222 223 224 225 226
{
    try
    {
        executeQuery(query, context);
    }
    catch (...)
    {
227 228
        status = ExecutionStatus::fromCurrentException();

229 230 231 232 233 234
        if (log)
            tryLogCurrentException(log, "Query " + query + " wasn't finished successfully");

        return false;
    }

235
    status = ExecutionStatus(0);
236 237 238 239 240 241 242
    if (log)
        LOG_DEBUG(log, "Executed query: " << query);

    return true;
}


243
void DDLWorker::processTask(const DDLLogEntry & node, const std::string & node_name)
244
{
245
    LOG_DEBUG(log, "Processing node " << node_name << " (" << node.query << ")");
246

247
    String node_path = queue_dir + "/" + node_name;
248 249
    createStatusDirs(node_path);

250
    bool should_not_execute = current_node == node_name && current_node_was_executed;
251

252 253 254 255
    if (!should_not_execute)
    {
        current_node = node_name;
        current_node_was_executed = false;
256

257
        zookeeper->create(node_path + "/active/" + host_id, "", zkutil::CreateMode::Ephemeral);
258

259 260 261 262
        try
        {
            ASTPtr query_ast;
            {
263
                const char * begin = &node.query.front();
264 265
                ParserQuery parser_query(begin + node.query.size());
                String description;
266 267
                query_ast = parseQuery(parser_query, begin, begin + node.query.size(), description);
            }
268

269 270 271 272 273 274 275
            const ASTQueryWithOnCluster * query;
            if (!query_ast || !(query = dynamic_cast<const ASTQueryWithOnCluster *>(query_ast.get())))
                throw Exception("Recieved unsupported DDL query", ErrorCodes::NOT_IMPLEMENTED);

            String cluster_name = query->cluster;
            auto cluster = context.getCluster(cluster_name);

276
            auto shard_host_num = tryGetShardAndHostNum(cluster->getShardsAddresses(), host_name, port);
277
            if (!shard_host_num)
278 279 280 281
            {
                throw Exception("Cannot find own address (" + host_id + ") in cluster " + cluster_name + " configuration",
                                ErrorCodes::INCONSISTENT_CLUSTER_DEFINITION);
            }
282

283 284 285
            size_t shard_num = shard_host_num->first;
            size_t host_num = shard_host_num->second;

286
            const auto & host_address = cluster->getShardsAddresses().at(shard_num).at(host_num);
287 288
            ASTPtr rewritten_ast = query->getRewrittenASTWithoutOnCluster(host_address.default_database);
            String rewritten_query = queryToString(rewritten_ast);
289

290
            LOG_DEBUG(log, "Executing query: " << rewritten_query);
291

292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311
            if (auto query_alter = dynamic_cast<const ASTAlterQuery *>(rewritten_ast.get()))
            {
                processTaskAlter(query_alter, rewritten_query, cluster, shard_num, node_path);
            }
            else
            {
                tryExecuteQuery(rewritten_query, context, current_node_execution_status, log);
            }
        }
        catch (const zkutil::KeeperException & e)
        {
            throw;
        }
        catch (...)
        {
            current_node_execution_status = ExecutionStatus::fromCurrentException("An error occured during query preparation");
        }

        /// We need to distinguish ZK errors occured before and after query executing
        current_node_was_executed = true;
312 313
    }

314 315 316 317 318
    /// Delete active flag and create finish flag
    zkutil::Ops ops;
    ops.emplace_back(std::make_unique<zkutil::Op::Remove>(node_path + "/active/" + host_id, -1));
    ops.emplace_back(std::make_unique<zkutil::Op::Create>(node_path + "/finished/" + host_id,
        current_node_execution_status.serializeText(), zookeeper->getDefaultACL(), zkutil::CreateMode::Persistent));
319

320 321 322 323
    int code = zookeeper->tryMultiWithRetries(ops);
    if (code != ZOK && code != ZNONODE)
        throw zkutil::KeeperException("Cannot commit executed node " + node_name, code);
}
324 325


326 327 328 329 330 331 332 333 334
void DDLWorker::processTaskAlter(
    const ASTAlterQuery * query_alter,
    const String & rewritten_query,
    const std::shared_ptr<Cluster> & cluster,
    ssize_t shard_num,
    const String & node_path)
{
    String database = query_alter->database.empty() ? context.getCurrentDatabase() : query_alter->database;
    StoragePtr storage = context.getTable(database, query_alter->table);
335

336 337
    bool execute_once_on_replica = storage->supportsReplication();
    bool execute_on_leader_replica = false;
338

339
    for (const auto & param : query_alter->parameters)
340
    {
341 342
        if (!isSupportedAlterType(param.type))
            throw Exception("Unsupported type of ALTER query", ErrorCodes::NOT_IMPLEMENTED);
343

344 345 346
        if (execute_once_on_replica)
            execute_on_leader_replica |= param.type == ASTAlterQuery::DROP_PARTITION;
    }
347

348 349
    const auto & shard_info = cluster->getShardsInfo().at(shard_num);
    bool config_is_replicated_shard = shard_info.hasInternalReplication();
350

351 352 353 354 355 356 357 358 359 360
    if (execute_once_on_replica && !config_is_replicated_shard)
    {
        throw Exception("Table " + query_alter->table + " is replicated, but shard #" + toString(shard_num + 1) +
            " isn't replicated according to its cluster definition", ErrorCodes::INCONSISTENT_CLUSTER_DEFINITION);
    }
    else if (!execute_once_on_replica && config_is_replicated_shard)
    {
        throw Exception("Table " + query_alter->table + " isn't replicated, but shard #" + toString(shard_num + 1) +
            " replicated according to its cluster definition", ErrorCodes::INCONSISTENT_CLUSTER_DEFINITION);
    }
361

362 363
    if (execute_once_on_replica)
    {
364 365 366 367
        /// The following code may perform ALTER twice if
        ///  current secver aquires lock, executes replicated alter,
        ///  losts zookeeper connection and doesn't have time to create /executed node, second server executes replicated alter again
        /// To avoid this problem alter() method of replicated tables should be changed and takes into account ddl query id tag.
368 369
        if (!context.getSettingsRef().distributed_ddl_allow_replicated_alter)
            throw Exception("Distributed DDL alters don't work properly yet", ErrorCodes::NOT_IMPLEMENTED);
370

371
        Strings replica_names;
372
        for (const auto & address : cluster->getShardsAddresses().at(shard_num))
373 374
            replica_names.emplace_back(address.toString());
        std::sort(replica_names.begin(), replica_names.end());
375

376 377 378
        String shard_dir_name;
        for (auto it = replica_names.begin(); it != replica_names.end(); ++it)
            shard_dir_name += *it + (std::next(it) != replica_names.end() ? "," : "");
379

380 381 382
        String shard_path = node_path + "/shards/" + shard_dir_name;
        String is_executed_path = shard_path + "/executed";
        zookeeper->createAncestors(shard_path + "/");
383

384 385 386 387
        bool alter_executed_by_replica = false;
        {
            auto zookeeper_holder = std::make_shared<zkutil::ZooKeeperHolder>();
            zookeeper_holder->initFromInstance(zookeeper);
388

389 390 391 392
            zkutil::Lock lock(zookeeper_holder, shard_path, "lock", host_id);
            std::mt19937 rng(std::hash<String>{}(host_id) + reinterpret_cast<intptr_t>(&rng));

            for (int num_tries = 0; num_tries < 10; ++num_tries)
393
            {
394 395 396 397 398
                if (zookeeper->exists(is_executed_path))
                {
                    alter_executed_by_replica = true;
                    break;
                }
399

400
                if (lock.tryLock())
401
                {
402
                    tryExecuteQuery(rewritten_query, context, current_node_execution_status, log);
403

404
                    if (execute_on_leader_replica && current_node_execution_status.code == ErrorCodes::NOT_IMPLEMENTED)
405
                    {
406
                        /// TODO: it is ok to recieve exception "host is not leader"
407 408
                    }

409 410 411 412
                    zookeeper->create(is_executed_path, host_id, zkutil::CreateMode::Persistent);
                    lock.unlock();
                    alter_executed_by_replica = true;
                    break;
413 414
                }

415
                std::this_thread::sleep_for(std::chrono::duration<double>(std::uniform_real_distribution<double>(0, 1)(rng)));
416 417
            }
        }
418 419 420

        if (!alter_executed_by_replica)
            current_node_execution_status = ExecutionStatus(ErrorCodes::NOT_IMPLEMENTED, "Cannot enqueue replicated DDL query");
421 422 423
    }
    else
    {
424
        tryExecuteQuery(rewritten_query, context, current_node_execution_status, log);
425 426 427 428
    }
}


429 430 431 432 433 434 435
void DDLWorker::cleanupQueue(const Strings * node_names_to_check)
{
    /// Both ZK and Poco use Unix epoch
    size_t current_time_seconds = Poco::Timestamp().epochTime();
    constexpr size_t zookeeper_time_resolution = 1000;

    // Too early to check
436
    if (last_cleanup_time_seconds && current_time_seconds < last_cleanup_time_seconds + cleanup_min_period_seconds)
437 438 439 440
        return;

    last_cleanup_time_seconds = current_time_seconds;

441 442
    LOG_DEBUG(log, "Cleaning queue");

443 444 445 446
    String data;
    zkutil::Stat stat;
    DDLLogEntry node;

447
    Strings node_names_fetched = node_names_to_check ? Strings{} : zookeeper->getChildren(queue_dir);
448 449 450 451 452 453
    const Strings & node_names = (node_names_to_check) ? *node_names_to_check : node_names_fetched;

    for (const String & node_name : node_names)
    {
        try
        {
454
            String node_path = queue_dir + "/" + node_name;
455 456 457
            if (!zookeeper->tryGet(node_path, data, &stat))
                continue;

458
            /// TODO: Add shared lock to avoid rare race counditions.
459 460 461 462 463 464 465 466 467 468

            size_t zookeeper_time_seconds = stat.mtime / zookeeper_time_resolution;
            if (zookeeper_time_seconds + node_max_lifetime_seconds < current_time_seconds)
            {
                size_t lifetime_seconds = current_time_seconds - zookeeper_time_seconds;
                LOG_INFO(log, "Lifetime of node " << node_name << " (" << lifetime_seconds << " sec.) is expired, deleting it");
                zookeeper->removeRecursive(node_path);
                continue;
            }

469
            Strings finished_nodes = zookeeper->getChildren(node_path + "/finished");
470 471
            node.parse(data);

472
            if (finished_nodes.size() >= node.hosts.size())
473 474 475 476 477 478 479 480 481 482 483 484
            {
                LOG_INFO(log, "Node " << node_name << " had been executed by each host, deleting it");
                zookeeper->removeRecursive(node_path);
            }
        }
        catch (...)
        {
            tryLogCurrentException(log, "An error occured while checking and cleaning node " + node_name + " from queue");
        }
    }
}

485

486 487
/// Try to create unexisting "status" dirs for a node
void DDLWorker::createStatusDirs(const std::string & node_path)
488
{
489
    zkutil::Ops ops;
490
    auto acl = zookeeper->getDefaultACL();
491
    ops.emplace_back(std::make_unique<zkutil::Op::Create>(node_path + "/active", "", acl, zkutil::CreateMode::Persistent));
492
    ops.emplace_back(std::make_unique<zkutil::Op::Create>(node_path + "/finished", "", acl, zkutil::CreateMode::Persistent));
493

494 495 496 497
    int code = zookeeper->tryMulti(ops);
    if (code != ZOK && code != ZNODEEXISTS)
        throw zkutil::KeeperException(code);
}
498 499


500
/// Puts the entry into the queue as a new persistent sequential node "<queue_dir>/query-...".
/// Returns the path of the created node, or an empty string if the entry has no hosts
/// (nothing is created in that case).
String DDLWorker::enqueueQuery(DDLLogEntry & entry)
{
    /// Nobody would execute such a task.
    if (entry.hosts.empty())
        return {};

    const String query_path_prefix = queue_dir + "/query-";
    zookeeper->createAncestors(query_path_prefix);

    const String serialized_entry = entry.toString();
    String created_path = zookeeper->create(query_path_prefix, serialized_entry, zkutil::CreateMode::PersistentSequential);

    /// Status directories are created right away, together with the task node.
    createStatusDirs(created_path);

    return created_path;
}

514

515 516
void DDLWorker::run()
{
517
    setThreadName("DDLWorker");
518 519
    LOG_DEBUG(log, "Started DDLWorker thread");

520 521 522
    zookeeper = context.getZooKeeper();
    zookeeper->createAncestors(queue_dir + "/");

523 524 525 526
    while (!stop_flag)
    {
        try
        {
527
            processTasks();
528

529 530 531 532 533
            LOG_DEBUG(log, "Waiting watch");
            event_queue_updated->wait();

            if (stop_flag)
                break;
534 535

            cleanupQueue();
536
        }
537 538 539 540 541
        catch (zkutil::KeeperException &)
        {
            LOG_DEBUG(log, "Recovering ZooKeeper session");
            zookeeper = context.getZooKeeper();
        }
542 543 544
        catch (...)
        {
            tryLogCurrentException(log);
545
            throw;
546
        }
547 548 549
    }
}

550

551
class DDLQueryStatusInputSream : public IProfilingBlockInputStream
552
{
553
public:
554

555
    DDLQueryStatusInputSream(const String & zk_node_path, Context & context, size_t num_hosts)
556
    : node_path(zk_node_path), context(context), watch(CLOCK_MONOTONIC_COARSE)
557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578
    {
        sample = Block{
            {std::make_shared<DataTypeString>(),    "host"},
            {std::make_shared<DataTypeUInt64>(),    "status"},
            {std::make_shared<DataTypeString>(),    "error"},
            {std::make_shared<DataTypeUInt64>(),    "num_hosts_remaining"},
            {std::make_shared<DataTypeUInt64>(),    "num_hosts_active"},
        };

        setTotalRowsApprox(num_hosts);
    }

    String getName() const override
    {
        return "DDLQueryStatusInputSream";
    }

    String getID() const override
    {
        return "DDLQueryStatusInputSream(" + node_path + ")";
    }

579 580
    static constexpr size_t timeout_seconds = 120;

581 582 583 584 585 586 587 588 589 590 591 592 593 594
    Block readImpl() override
    {
        Block res;
        if (num_hosts_finished >= total_rows_approx)
            return res;

        auto zookeeper = context.getZooKeeper();
        size_t try_number = 0;

        while(res.rows() == 0)
        {
            if (is_cancelled)
                return res;

595 596
            auto elapsed_seconds = watch.elapsedSeconds();
            if (elapsed_seconds > timeout_seconds)
597
                throw Exception("Watching query is executing too long (" + toString(std::round(elapsed_seconds)) + " sec.)", ErrorCodes::TIMEOUT_EXCEEDED);
598

599
            if (num_hosts_finished != 0 || try_number != 0)
600
                std::this_thread::sleep_for(std::chrono::milliseconds(50 * std::min(20LU, try_number + 1)));
601

602
            /// TODO: add shared lock
603
            if (!zookeeper->exists(node_path))
604 605 606 607 608
            {
                throw Exception("Cannot provide query execution status. The query's node " + node_path
                                + " had been deleted by cleaner since it was finished (or its lifetime is expired)",
                                ErrorCodes::UNFINISHED);
            }
609

610
            Strings new_hosts = getNewAndUpdate(finished_hosts_set, getChildrenAllowNoNode(zookeeper, node_path + "/finished"));
611 612 613 614
            ++try_number;
            if (new_hosts.empty())
                continue;

615 616
            Strings cur_active_hosts = getChildrenAllowNoNode(zookeeper, node_path + "/active");

617
            res = sample.cloneEmpty();
618
            for (const String & host : new_hosts)
619
            {
620 621 622 623 624 625 626 627 628 629
                ExecutionStatus status(1, "Cannot obtain error message");
                {
                    String status_data;
                    if (zookeeper->tryGet(node_path + "/finished/" + host, status_data))
                        status.deserializeText(status_data);
                }

                res.getByName("host").column->insert(host);
                res.getByName("status").column->insert(static_cast<UInt64>(status.code));
                res.getByName("error").column->insert(status.message);
630
                res.getByName("num_hosts_remaining").column->insert(total_rows_approx - (++num_hosts_finished));
631
                res.getByName("num_hosts_active").column->insert(cur_active_hosts.size());
632 633
            }
        }
634

635 636 637
        return res;
    }

638 639 640 641 642 643 644 645 646 647
    static Strings getChildrenAllowNoNode(const std::shared_ptr<zkutil::ZooKeeper> & zookeeper, const String & node_path)
    {
        Strings res;
        int code = zookeeper->tryGetChildren(node_path, res);
        if (code != ZOK && code != ZNONODE)
            throw zkutil::KeeperException(code, node_path);
        return res;
    }

    static Strings getNewAndUpdate(NameSet & prev, const Strings & cur_list)
648 649 650 651 652
    {
        Strings diff;
        for (const String & elem : cur_list)
        {
            if (!prev.count(elem))
653
            {
654
                diff.emplace_back(elem);
655 656
                prev.emplace(elem);
            }
657 658 659 660 661 662 663 664 665 666 667 668 669
        }

        return diff;
    }

    ~DDLQueryStatusInputSream() override = default;

    Block sample;

private:
    String node_path;
    Context & context;

670 671 672
    Stopwatch watch;

    NameSet finished_hosts_set;
673
    size_t num_hosts_finished = 0;
674
};
675 676


677
/// Puts an ON CLUSTER DDL query into the distributed DDL queue for all hosts of the cluster.
/// Returns a BlockIO whose input stream reports per-host execution status;
/// if nothing was enqueued (the cluster has no hosts), the BlockIO is empty.
/// Throws NOT_IMPLEMENTED for queries that are not ON CLUSTER queries
/// and for ALTERs containing unsupported command types.
BlockIO executeDDLQueryOnCluster(const ASTPtr & query_ptr, Context & context)
{
    const auto query = dynamic_cast<const ASTQueryWithOnCluster *>(query_ptr.get());
    if (!query)
    {
        throw Exception("Distributed execution is not supported for such DDL queries",
                        ErrorCodes::NOT_IMPLEMENTED);
    }

    /// Reject unsupported ALTERs on the initiator, before anything is written to the queue.
    auto query_alter = dynamic_cast<const ASTAlterQuery *>(query_ptr.get());
    if (query_alter)
    {
        for (const auto & param : query_alter->parameters)
        {
            if (!isSupportedAlterType(param.type))
                throw Exception("Unsupported type of ALTER query", ErrorCodes::NOT_IMPLEMENTED);
        }
    }

    ClusterPtr cluster = context.getCluster(query->cluster);
    DDLWorker & ddl_worker = context.getDDLWorker();

    DDLLogEntry entry;
    entry.query = queryToString(query_ptr);
    entry.initiator = ddl_worker.getHostName();

    /// Iterate the address table in place: a copy of it is not needed to collect host names.
    for (const auto & shard : cluster->getShardsAddresses())
    {
        for (const auto & addr : shard)
            entry.hosts.emplace_back(addr.toString());
    }

    String node_path = ddl_worker.enqueueQuery(entry);

    BlockIO io;
    if (node_path.empty())
        return io;

    auto stream = std::make_shared<DDLQueryStatusInputSream>(node_path, context, entry.hosts.size());
    io.in_sample = stream->sample.cloneEmpty();
    io.in = std::move(stream);
    return io;
}


723
}