/*
 * virnetsocket.c: generic network socket handling
 *
 * Copyright (C) 2006-2014 Red Hat, Inc.
 * Copyright (C) 2006 Daniel P. Berrange
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library.  If not, see
 * <http://www.gnu.org/licenses/>.
 *
 * Author: Daniel P. Berrange <berrange@redhat.com>
 */

#include <config.h>

#include <sys/stat.h>
#include <sys/socket.h>
#include <unistd.h>
#include <sys/wait.h>
30
#include <signal.h>
31
#include <fcntl.h>
32
#include <netdb.h>
33 34 35 36 37

#ifdef HAVE_NETINET_TCP_H
# include <netinet/tcp.h>
#endif

38 39 40 41
#ifdef HAVE_SYS_UCRED_H
# include <sys/ucred.h>
#endif

42
#include "c-ctype.h"
43
#ifdef WITH_SELINUX
44 45 46
# include <selinux/selinux.h>
#endif

47
#include "virnetsocket.h"
48
#include "virutil.h"
49
#include "viralloc.h"
50
#include "virerror.h"
51
#include "virlog.h"
E
Eric Blake 已提交
52
#include "virfile.h"
53
#include "virthread.h"
54
#include "virprobe.h"
55
#include "virprocess.h"
56
#include "virstring.h"
57 58
#include "passfd.h"

59
#if WITH_SSH2
60 61 62
# include "virnetsshsession.h"
#endif

63 64
#define VIR_FROM_THIS VIR_FROM_RPC

65
VIR_LOG_INIT("rpc.netsocket");
66 67

struct _virNetSocket {
68
    virObjectLockable parent;
69

70 71 72 73 74
    int fd;
    int watch;
    pid_t pid;
    int errfd;
    bool client;
75 76

    /* Event callback fields */
77 78
    virNetSocketIOFunc func;
    void *opaque;
79 80
    virFreeCallback ff;

81 82 83 84
    virSocketAddr localAddr;
    virSocketAddr remoteAddr;
    char *localAddrStr;
    char *remoteAddrStr;
85

86
#if WITH_GNUTLS
87
    virNetTLSSessionPtr tlsSession;
88
#endif
89
#if WITH_SASL
90 91 92 93 94 95 96 97 98 99
    virNetSASLSessionPtr saslSession;

    const char *saslDecoded;
    size_t saslDecodedLength;
    size_t saslDecodedOffset;

    const char *saslEncoded;
    size_t saslEncodedLength;
    size_t saslEncodedOffset;
#endif
100
#if WITH_SSH2
101 102
    virNetSSHSessionPtr sshSession;
#endif
103 104 105
};


106 107 108 109 110
static virClassPtr virNetSocketClass;
static void virNetSocketDispose(void *obj);

static int virNetSocketOnceInit(void)
{
111
    if (!(virNetSocketClass = virClassNew(virClassForObjectLockable(),
112
                                          "virNetSocket",
113 114 115 116 117 118 119 120 121 122
                                          sizeof(virNetSocket),
                                          virNetSocketDispose)))
        return -1;

    return 0;
}

VIR_ONCE_GLOBAL_INIT(virNetSocket)


123
#ifndef WIN32
124
static int virNetSocketForkDaemon(const char *binary, int passfd)
125 126 127 128 129 130 131
{
    int ret;
    virCommandPtr cmd = virCommandNewArgList(binary,
                                             "--timeout=30",
                                             NULL);

    virCommandAddEnvPassCommon(cmd);
132 133 134
    virCommandAddEnvPassBlockSUID(cmd, "XDG_CACHE_HOME", NULL);
    virCommandAddEnvPassBlockSUID(cmd, "XDG_CONFIG_HOME", NULL);
    virCommandAddEnvPassBlockSUID(cmd, "XDG_RUNTIME_DIR", NULL);
135 136
    virCommandClearCaps(cmd);
    virCommandDaemonize(cmd);
137 138 139 140
    if (passfd) {
        virCommandPassFD(cmd, passfd, VIR_COMMAND_PASS_FD_CLOSE_PARENT);
        virCommandPassListenFDs(cmd);
    }
141 142 143 144 145 146 147 148 149 150 151 152 153 154 155
    ret = virCommandRun(cmd, NULL);
    virCommandFree(cmd);
    return ret;
}
#endif


/*
 * Wrap an already-open descriptor in a new virNetSocket object.
 *
 * @localAddr:  local address of @fd, or NULL if not known
 * @remoteAddr: peer address of @fd, or NULL if not known
 * @isClient:   true for a connecting socket, false for a listener
 * @fd:         socket descriptor; made close-on-exec and non-blocking
 * @errfd:      stderr pipe of a helper process, or -1
 * @pid:        pid of a helper process, stored as-is
 *
 * For AF_INET/AF_INET6 local addresses TCP_NODELAY is enabled on @fd.
 *
 * Returns the new object, or NULL on failure.  On failure the caller
 * still owns @fd and @errfd and must close them.
 */
static virNetSocketPtr virNetSocketNew(virSocketAddrPtr localAddr,
                                       virSocketAddrPtr remoteAddr,
                                       bool isClient,
                                       int fd, int errfd, pid_t pid)
{
    virNetSocketPtr sock;
    int nodelay = 1;

    if (virNetSocketInitialize() < 0)
        return NULL;

    VIR_DEBUG("localAddr=%p remoteAddr=%p fd=%d errfd=%d pid=%lld",
              localAddr, remoteAddr,
              fd, errfd, (long long) pid);

    if (virSetCloseExec(fd) < 0) {
        virReportSystemError(errno, "%s",
                             _("Unable to set close-on-exec flag"));
        return NULL;
    }
    if (virSetNonBlock(fd) < 0) {
        virReportSystemError(errno, "%s",
                             _("Unable to enable non-blocking flag"));
        return NULL;
    }

    if (!(sock = virObjectLockableNew(virNetSocketClass)))
        return NULL;

    if (localAddr)
        sock->localAddr = *localAddr;
    if (remoteAddr)
        sock->remoteAddr = *remoteAddr;
    sock->fd = fd;
    sock->errfd = errfd;
    sock->pid = pid;

    /* Disable nagle for TCP sockets */
    if (sock->localAddr.data.sa.sa_family == AF_INET ||
        sock->localAddr.data.sa.sa_family == AF_INET6) {
        if (setsockopt(fd, IPPROTO_TCP, TCP_NODELAY,
                       &nodelay,
                       sizeof(nodelay)) < 0) {
            virReportSystemError(errno, "%s",
                                 _("Unable to disable nagle algorithm"));
            goto error;
        }
    }


    if (localAddr &&
        !(sock->localAddrStr = virSocketAddrFormatFull(localAddr, true, ";")))
        goto error;

    if (remoteAddr &&
        !(sock->remoteAddrStr = virSocketAddrFormatFull(remoteAddr, true, ";")))
        goto error;

    sock->client = isClient;

    PROBE(RPC_SOCKET_NEW,
          "sock=%p fd=%d errfd=%d pid=%lld localAddr=%s, remoteAddr=%s",
          sock, fd, errfd, (long long) pid,
          NULLSTR(sock->localAddrStr), NULLSTR(sock->remoteAddrStr));

    return sock;

 error:
    /* Detach the descriptors before dropping the object so that they are
     * not touched when it is released. */
    sock->fd = sock->errfd = -1; /* Caller owns fd/errfd on failure */
    virObjectUnref(sock);
    return NULL;
}


/*
 * Create one bound TCP socket object per address that @nodename/@service
 * resolves to.
 *
 * @nodename:  host name or address to bind to, or NULL for the wildcard
 * @service:   port number or service name
 * @retsocks:  set to a newly allocated array of sockets on success
 * @nretsocks: set to the number of entries in @retsocks
 *
 * Addresses whose family is unsupported (EAFNOSUPPORT) or whose port is
 * already in use (EADDRINUSE) are skipped; an error is reported only if
 * no socket at all could be created for one of those reasons.
 *
 * Returns 0 on success, -1 on failure with *retsocks NULL and
 * *nretsocks 0.
 */
int virNetSocketNewListenTCP(const char *nodename,
                             const char *service,
                             virNetSocketPtr **retsocks,
                             size_t *nretsocks)
{
    virNetSocketPtr *socks = NULL;
    size_t nsocks = 0;
    struct addrinfo *ai = NULL;
    struct addrinfo *runp;
    struct addrinfo hints;
    int fd = -1;
    int e;
    size_t i;
    bool addrInUse = false;
    bool familyNotSupported = false;
    virSocketAddr tmp_addr;

    *retsocks = NULL;
    *nretsocks = 0;

    memset(&hints, 0, sizeof(hints));
    hints.ai_flags = AI_PASSIVE;
    hints.ai_socktype = SOCK_STREAM;

    /* Don't use ADDRCONFIG for binding to the wildcard address.
     * Just catch the error returned by socket() if the system has
     * no IPv6 support.
     *
     * This allows libvirtd to be started in parallel with the network
     * startup in most cases.
     */
    if (nodename &&
        !(virSocketAddrParse(&tmp_addr, nodename, AF_UNSPEC) > 0 &&
          virSocketAddrIsWildcard(&tmp_addr)))
        hints.ai_flags |= AI_ADDRCONFIG;

    e = getaddrinfo(nodename, service, &hints, &ai);
    if (e != 0) {
        /* nodename is legitimately NULL for wildcard binds, so never feed
         * it to %s unguarded. */
        virReportError(VIR_ERR_SYSTEM_ERROR,
                       _("Unable to resolve address '%s' service '%s': %s"),
                       NULLSTR(nodename), NULLSTR(service), gai_strerror(e));
        return -1;
    }

    runp = ai;
    while (runp) {
        virSocketAddr addr;

        memset(&addr, 0, sizeof(addr));

        if ((fd = socket(runp->ai_family, runp->ai_socktype,
                         runp->ai_protocol)) < 0) {
            if (errno == EAFNOSUPPORT) {
                familyNotSupported = true;
                runp = runp->ai_next;
                continue;
            }
            virReportSystemError(errno, "%s", _("Unable to create socket"));
            goto error;
        }

        if (virSetSockReuseAddr(fd) < 0) {
            virReportSystemError(errno, "%s", _("Unable to enable port reuse"));
            goto error;
        }

#ifdef IPV6_V6ONLY
        if (runp->ai_family == PF_INET6) {
            int on = 1;
            /*
             * Normally on Linux an INET6 socket will bind to the INET4
             * address too. If getaddrinfo returns results with INET4
             * first though, this will result in INET6 binding failing.
             * We can trivially cope with multiple server sockets, so
             * we force it to only listen on IPv6
             */
            if (setsockopt(fd, IPPROTO_IPV6, IPV6_V6ONLY,
                           (void*)&on, sizeof(on)) < 0) {
                virReportSystemError(errno, "%s",
                                     _("Unable to force bind to IPv6 only"));
                goto error;
            }
        }
#endif

        if (bind(fd, runp->ai_addr, runp->ai_addrlen) < 0) {
            if (errno != EADDRINUSE) {
                virReportSystemError(errno, "%s", _("Unable to bind to port"));
                goto error;
            }
            /* Remember the failure but keep trying the other addresses. */
            addrInUse = true;
            VIR_FORCE_CLOSE(fd);
            runp = runp->ai_next;
            continue;
        }

        addr.len = sizeof(addr.data);
        if (getsockname(fd, &addr.data.sa, &addr.len) < 0) {
            virReportSystemError(errno, "%s", _("Unable to get local socket name"));
            goto error;
        }

        VIR_DEBUG("%p f=%d f=%d", &addr, runp->ai_family, addr.data.sa.sa_family);

        if (VIR_EXPAND_N(socks, nsocks, 1) < 0)
            goto error;

        if (!(socks[nsocks-1] = virNetSocketNew(&addr, NULL, false, fd, -1, 0)))
            goto error;
        runp = runp->ai_next;
        /* The descriptor now belongs to the socket object. */
        fd = -1;
    }

    if (nsocks == 0 && familyNotSupported) {
        virReportSystemError(EAFNOSUPPORT, "%s", _("Unable to bind to port"));
        goto error;
    }

    if (nsocks == 0 &&
        addrInUse) {
        virReportSystemError(EADDRINUSE, "%s", _("Unable to bind to port"));
        goto error;
    }

    freeaddrinfo(ai);

    *retsocks = socks;
    *nretsocks = nsocks;
    return 0;

 error:
    for (i = 0; i < nsocks; i++)
        virObjectUnref(socks[i]);
    VIR_FREE(socks);
    freeaddrinfo(ai);
    VIR_FORCE_CLOSE(fd);
    return -1;
}


#if HAVE_SYS_UN_H
/*
 * Create a UNIX domain socket bound to @path.
 *
 * @path:    filesystem path, or a name starting with '@' for an abstract
 *           socket (the '@' is replaced by a NUL byte in the address)
 * @mask:    permission bits for the socket; the umask is temporarily set
 *           to ~@mask around bind()
 * @user:    owner passed to chown()
 * @grp:     group passed to chown(); ownership is only changed when this
 *           is non-zero
 * @retsock: set to the new socket on success, NULL otherwise
 *
 * For non-abstract sockets any existing file at @path is unlinked before
 * binding, and @path is unlinked again on failure.
 *
 * Returns 0 on success, -1 on failure.
 */
int virNetSocketNewListenUNIX(const char *path,
                              mode_t mask,
                              uid_t user,
                              gid_t grp,
                              virNetSocketPtr *retsock)
{
    virSocketAddr addr;
    mode_t oldmask;
    int fd = -1;

    *retsock = NULL;

    memset(&addr, 0, sizeof(addr));

    addr.len = sizeof(addr.data.un);

    if ((fd = socket(PF_UNIX, SOCK_STREAM, 0)) < 0) {
        virReportSystemError(errno, "%s", _("Failed to create socket"));
        goto error;
    }

    addr.data.un.sun_family = AF_UNIX;
    if (virStrcpyStatic(addr.data.un.sun_path, path) == NULL) {
        virReportSystemError(ENAMETOOLONG,
                             _("Path %s too long for unix socket"), path);
        goto error;
    }
    if (addr.data.un.sun_path[0] == '@')
        addr.data.un.sun_path[0] = '\0';
    else
        unlink(addr.data.un.sun_path);

    oldmask = umask(~mask);

    if (bind(fd, &addr.data.sa, addr.len) < 0) {
        /* Restore the umask before reporting so it is never left changed. */
        umask(oldmask);
        virReportSystemError(errno,
                             _("Failed to bind socket to '%s'"),
                             path);
        goto error;
    }
    umask(oldmask);

    /* chown() doesn't work for abstract sockets but we use them only
     * if libvirtd runs unprivileged
     */
    if (grp != 0 && chown(path, user, grp)) {
        virReportSystemError(errno,
                             _("Failed to change ownership of '%s' to %d:%d"),
                             path, (int) user, (int) grp);
        goto error;
    }

    if (!(*retsock = virNetSocketNew(&addr, NULL, false, fd, -1, 0)))
        goto error;

    return 0;

 error:
    if (path[0] != '@')
        unlink(path);
    VIR_FORCE_CLOSE(fd);
    return -1;
}
#else
/*
 * Fallback used when <sys/un.h> is unavailable: always reports ENOSYS
 * and returns -1.
 */
int virNetSocketNewListenUNIX(const char *path ATTRIBUTE_UNUSED,
                              mode_t mask ATTRIBUTE_UNUSED,
                              uid_t user ATTRIBUTE_UNUSED,
                              gid_t grp ATTRIBUTE_UNUSED,
                              virNetSocketPtr *retsock ATTRIBUTE_UNUSED)
{
    virReportSystemError(ENOSYS, "%s",
                         _("UNIX sockets are not supported on this platform"));
    return -1;
}
#endif

438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457
/*
 * Build a listening socket object around an existing descriptor.
 *
 * @fd:      already-open socket; its local address is queried with
 *           getsockname()
 * @retsock: receives the new socket, or NULL on failure
 *
 * Returns 0 on success, -1 on failure.
 */
int virNetSocketNewListenFD(int fd,
                            virNetSocketPtr *retsock)
{
    virSocketAddr local;
    virNetSocketPtr created;

    *retsock = NULL;

    memset(&local, 0, sizeof(local));
    local.len = sizeof(local.data);

    if (getsockname(fd, &local.data.sa, &local.len) < 0) {
        virReportSystemError(errno, "%s", _("Unable to get local socket name"));
        return -1;
    }

    created = virNetSocketNew(&local, NULL, false, fd, -1, 0);
    *retsock = created;

    return created ? 0 : -1;
}

458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475

/*
 * Open a TCP connection to @nodename/@service.
 *
 * Each address returned by getaddrinfo() is tried in order until one
 * connect() succeeds; the errno of the last failed attempt is reported
 * if none does.  A failure to create a socket aborts immediately.
 *
 * @nodename: host name or address of the server
 * @service:  port number or service name
 * @retsock:  set to the connected socket on success, NULL otherwise
 *
 * Returns 0 on success, -1 on failure.
 */
int virNetSocketNewConnectTCP(const char *nodename,
                              const char *service,
                              virNetSocketPtr *retsock)
{
    struct addrinfo *ai = NULL;
    struct addrinfo hints;
    int fd = -1;
    int e;
    virSocketAddr localAddr;
    virSocketAddr remoteAddr;
    struct addrinfo *runp;
    int savedErrno = ENOENT;

    *retsock = NULL;

    memset(&localAddr, 0, sizeof(localAddr));
    memset(&remoteAddr, 0, sizeof(remoteAddr));

    memset(&hints, 0, sizeof(hints));
    hints.ai_flags = AI_PASSIVE | AI_ADDRCONFIG;
    hints.ai_socktype = SOCK_STREAM;

    e = getaddrinfo(nodename, service, &hints, &ai);
    if (e != 0) {
        virReportError(VIR_ERR_SYSTEM_ERROR,
                       _("Unable to resolve address '%s' service '%s': %s"),
                       NULLSTR(nodename), NULLSTR(service), gai_strerror(e));
        return -1;
    }

    runp = ai;
    while (runp) {
        if ((fd = socket(runp->ai_family, runp->ai_socktype,
                         runp->ai_protocol)) < 0) {
            virReportSystemError(errno, "%s", _("Unable to create socket"));
            goto error;
        }

        /* Port reuse is best-effort on the client side. */
        if (virSetSockReuseAddr(fd) < 0) {
            VIR_WARN("Unable to enable port reuse");
        }

        if (connect(fd, runp->ai_addr, runp->ai_addrlen) >= 0)
            break;

        /* Keep the reason before VIR_FORCE_CLOSE() can disturb errno. */
        savedErrno = errno;
        VIR_FORCE_CLOSE(fd);
        runp = runp->ai_next;
    }

    if (fd == -1) {
        virReportSystemError(savedErrno,
                             _("unable to connect to server at '%s:%s'"),
                             NULLSTR(nodename), NULLSTR(service));
        goto error;
    }

    localAddr.len = sizeof(localAddr.data);
    if (getsockname(fd, &localAddr.data.sa, &localAddr.len) < 0) {
        virReportSystemError(errno, "%s", _("Unable to get local socket name"));
        goto error;
    }

    remoteAddr.len = sizeof(remoteAddr.data);
    if (getpeername(fd, &remoteAddr.data.sa, &remoteAddr.len) < 0) {
        virReportSystemError(errno, "%s", _("Unable to get remote socket name"));
        goto error;
    }

    if (!(*retsock = virNetSocketNew(&localAddr, &remoteAddr, true, fd, -1, 0)))
        goto error;

    freeaddrinfo(ai);

    return 0;

 error:
    freeaddrinfo(ai);
    VIR_FORCE_CLOSE(fd);
    return -1;
}


541
#ifdef HAVE_SYS_UN_H
542 543 544 545 546
/*
 * Connect to the UNIX domain socket at @path, optionally starting the
 * daemon that serves it.
 *
 * @path:        socket path, or a name starting with '@' for an abstract
 *               socket
 * @spawnDaemon: when true and the first connection attempt fails, bind a
 *               listening socket at @path and start @binary with it
 * @binary:      daemon executable; required when @spawnDaemon is true
 * @retsock:     set to the connected socket on success, NULL otherwise
 *
 * Returns 0 on success, -1 on failure.
 */
int virNetSocketNewConnectUNIX(const char *path,
                               bool spawnDaemon,
                               const char *binary,
                               virNetSocketPtr *retsock)
{
    int fd = -1, passfd = -1;
    virSocketAddr localAddr;
    virSocketAddr remoteAddr;

    *retsock = NULL;

    memset(&localAddr, 0, sizeof(localAddr));
    memset(&remoteAddr, 0, sizeof(remoteAddr));

    remoteAddr.len = sizeof(remoteAddr.data.un);

    if (spawnDaemon && !binary) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("Auto-spawn of daemon requested, but no binary specified"));
        return -1;
    }

    if ((fd = socket(PF_UNIX, SOCK_STREAM, 0)) < 0) {
        virReportSystemError(errno, "%s", _("Failed to create socket"));
        goto error;
    }

    remoteAddr.data.un.sun_family = AF_UNIX;
    if (virStrcpyStatic(remoteAddr.data.un.sun_path, path) == NULL) {
        virReportSystemError(ENAMETOOLONG,
                             _("Path %s too long for unix socket"), path);
        goto error;
    }
    if (remoteAddr.data.un.sun_path[0] == '@')
        remoteAddr.data.un.sun_path[0] = '\0';

 retry:
    /* Only fall into the spawn logic when the connection attempt fails:
     * if a daemon is already listening we are done, and re-running
     * connect() on an already-connected socket would fail. */
    if (connect(fd, &remoteAddr.data.sa, remoteAddr.len) < 0) {
        int status = 0;
        pid_t pid = 0;

        if (!spawnDaemon) {
            virReportSystemError(errno, _("Failed to connect socket to '%s'"),
                                 path);
            goto error;
        }

        if ((passfd = socket(PF_UNIX, SOCK_STREAM, 0)) < 0) {
            virReportSystemError(errno, "%s", _("Failed to create socket"));
            goto error;
        }

        /*
         * We have to fork() here, because umask() is set
         * per-process, chmod() is racy and fchmod() has undefined
         * behaviour on sockets according to POSIX, so it doesn't
         * work outside Linux.
         */
        if ((pid = virFork()) < 0)
            goto error;

        if (pid == 0) {
            /* Child: bind with a restrictive umask and report the outcome
             * through the exit status only. */
            umask(0077);
            if (bind(passfd, &remoteAddr.data.sa, remoteAddr.len) < 0)
                _exit(EXIT_FAILURE);

            _exit(EXIT_SUCCESS);
        }

        if (virProcessWait(pid, &status, false) < 0)
            goto error;

        if (status != EXIT_SUCCESS) {
            /*
             * OK, so the subprocess failed to bind() the socket.  This may
             * mean that another daemon was starting at the same time and
             * succeeded with its bind().  So we'll try connecting again,
             * but this time without spawning the daemon.
             */
            VIR_FORCE_CLOSE(passfd); /* not needed any more; don't leak it */
            spawnDaemon = false;
            goto retry;
        }

        if (listen(passfd, 0) < 0) {
            virReportSystemError(errno, "%s",
                                 _("Failed to listen on socket that's about "
                                   "to be passed to the daemon"));
            goto error;
        }

        if (connect(fd, &remoteAddr.data.sa, remoteAddr.len) < 0) {
            virReportSystemError(errno, _("Failed to connect socket to '%s'"),
                                 path);
            goto error;
        }

        /* NOTE(review): passfd is handed over with
         * VIR_COMMAND_PASS_FD_CLOSE_PARENT; confirm whether the parent's
         * copy is already closed when this returns, since the error path
         * below closes passfd as well. */
        if (virNetSocketForkDaemon(binary, passfd) < 0)
            goto error;
    }

    localAddr.len = sizeof(localAddr.data);
    if (getsockname(fd, &localAddr.data.sa, &localAddr.len) < 0) {
        virReportSystemError(errno, "%s", _("Unable to get local socket name"));
        goto error;
    }

    if (!(*retsock = virNetSocketNew(&localAddr, &remoteAddr, true, fd, -1, 0)))
        goto error;

    return 0;

 error:
    VIR_FORCE_CLOSE(fd);
    VIR_FORCE_CLOSE(passfd);
    if (spawnDaemon)
        unlink(path);
    return -1;
}
#else
/*
 * Placeholder for builds without <sys/un.h>: UNIX sockets cannot be
 * used, so report ENOSYS and fail.
 */
int virNetSocketNewConnectUNIX(const char *path ATTRIBUTE_UNUSED,
                               bool spawnDaemon ATTRIBUTE_UNUSED,
                               const char *binary ATTRIBUTE_UNUSED,
                               virNetSocketPtr *retsock ATTRIBUTE_UNUSED)
{
    virReportSystemError(ENOSYS,
                         "%s",
                         _("UNIX sockets are not supported on this platform"));

    return -1;
}
#endif


#ifndef WIN32
/*
 * Start @cmd asynchronously and return a client socket connected to its
 * stdin/stdout, with its stderr available through a separate pipe.
 *
 * @cmd:     command to run; ownership is taken, it is freed on both
 *           success and failure
 * @retsock: set to the new socket on success, NULL otherwise
 *
 * Returns 0 on success, -1 on failure.
 */
int virNetSocketNewConnectCommand(virCommandPtr cmd,
                                  virNetSocketPtr *retsock)
{
    pid_t pid = 0;
    int sv[2] = { -1, -1 };
    int errfd[2] = { -1, -1 };

    *retsock = NULL;

    /* Fork off the external process.  Use socketpair to create a private
     * (unnamed) Unix domain socket to the child process so we don't have
     * to faff around with two file descriptors (a la 'pipe(2)').
     */
    if (socketpair(PF_UNIX, SOCK_STREAM, 0, sv) < 0) {
        virReportSystemError(errno, "%s",
                             _("unable to create socket pair"));
        goto error;
    }

    if (pipe(errfd) < 0) {
        virReportSystemError(errno, "%s",
                             _("unable to create pipe"));
        goto error;
    }

    /* The child uses sv[1] for both stdin and stdout, and the write end
     * of the pipe for stderr. */
    virCommandSetInputFD(cmd, sv[1]);
    virCommandSetOutputFD(cmd, &sv[1]);
    virCommandSetErrorFD(cmd, &errfd[1]);

    if (virCommandRunAsync(cmd, &pid) < 0)
        goto error;

    /* Parent continues here. */
    VIR_FORCE_CLOSE(sv[1]);
    VIR_FORCE_CLOSE(errfd[1]);

    if (!(*retsock = virNetSocketNew(NULL, NULL, true, sv[0], errfd[0], pid)))
        goto error;

    virCommandFree(cmd);

    return 0;

 error:
    VIR_FORCE_CLOSE(sv[0]);
    VIR_FORCE_CLOSE(sv[1]);
    VIR_FORCE_CLOSE(errfd[0]);
    VIR_FORCE_CLOSE(errfd[1]);

    virCommandAbort(cmd);
    virCommandFree(cmd);

    return -1;
}
#else
/*
 * WIN32 fallback: command tunnels are unavailable, so report ENOSYS and
 * fail.  @cmd is still released because callers hand over ownership of
 * it, exactly as with the real implementation.
 */
int virNetSocketNewConnectCommand(virCommandPtr cmd,
                                  virNetSocketPtr *retsock ATTRIBUTE_UNUSED)
{
    /* errno holds nothing meaningful here; use a fixed code like the
     * other "not supported" stubs in this file. */
    virReportSystemError(ENOSYS, "%s",
                         _("Tunnelling sockets not supported on this platform"));
    virCommandFree(cmd);
    return -1;
}
#endif

/*
 * Tunnel a connection to a remote UNIX socket through an external ssh
 * client running netcat on the far side.
 *
 * @nodename: remote host passed to ssh
 * @service:  ssh port ("-p"), or NULL
 * @binary:   ssh executable, or NULL for "ssh"
 * @username: remote login ("-l"), or NULL
 * @noTTY:    add "-T -o BatchMode=yes -e none"
 * @noVerify: add "-o StrictHostKeyChecking=no"
 * @netcat:   remote netcat executable, or NULL for "nc"
 * @keyfile:  identity file ("-i"), or NULL
 * @path:     UNIX socket path on the remote host
 * @retsock:  set to the new socket on success, NULL otherwise
 *
 * Returns 0 on success, -1 on failure.
 */
int virNetSocketNewConnectSSH(const char *nodename,
                              const char *service,
                              const char *binary,
                              const char *username,
                              bool noTTY,
                              bool noVerify,
                              const char *netcat,
                              const char *keyfile,
                              const char *path,
                              virNetSocketPtr *retsock)
{
    char *quoted;
    virCommandPtr cmd;
    virBuffer buf = VIR_BUFFER_INITIALIZER;

    *retsock = NULL;

    cmd = virCommandNew(binary ? binary : "ssh");
    virCommandAddEnvPassCommon(cmd);
    virCommandAddEnvPassBlockSUID(cmd, "KRB5CCNAME", NULL);
    virCommandAddEnvPassBlockSUID(cmd, "SSH_AUTH_SOCK", NULL);
    virCommandAddEnvPassBlockSUID(cmd, "SSH_ASKPASS", NULL);
    virCommandAddEnvPassBlockSUID(cmd, "DISPLAY", NULL);
    virCommandAddEnvPassBlockSUID(cmd, "XAUTHORITY", NULL);
    virCommandClearCaps(cmd);

    if (service)
        virCommandAddArgList(cmd, "-p", service, NULL);
    if (username)
        virCommandAddArgList(cmd, "-l", username, NULL);
    if (keyfile)
        virCommandAddArgList(cmd, "-i", keyfile, NULL);
    if (noTTY)
        virCommandAddArgList(cmd, "-T", "-o", "BatchMode=yes",
                             "-e", "none", NULL);
    if (noVerify)
        virCommandAddArgList(cmd, "-o", "StrictHostKeyChecking=no", NULL);

    if (!netcat)
        netcat = "nc";

    virCommandAddArgList(cmd, nodename, "sh", "-c", NULL);

    virBufferEscapeShell(&buf, netcat);
    if (virBufferCheckError(&buf) < 0) {
        virCommandFree(cmd);
        return -1;
    }
    quoted = virBufferContentAndReset(&buf);
    /*
     * This ugly thing is a shell script to detect availability of
     * the -q option for 'nc': debian and suse based distros need this
     * flag to ensure the remote nc will exit on EOF, so it will go away
     * when we close the connection tunnel. If it doesn't go away, subsequent
     * connection attempts will hang.
     *
     * Fedora's 'nc' doesn't have this option, and defaults to the desired
     * behavior.
     *
     * NOTE(review): unlike netcat, @path is inserted into the script
     * without shell escaping; confirm callers only pass trusted paths.
     */
    virCommandAddArgFormat(cmd,
         "'if '%s' -q 2>&1 | grep \"requires an argument\" >/dev/null 2>&1; then "
             "ARG=-q0;"
         "else "
             "ARG=;"
         "fi;"
         "'%s' $ARG -U %s'",
         quoted, quoted, path);

    VIR_FREE(quoted);
    /* virNetSocketNewConnectCommand() consumes cmd on every path. */
    return virNetSocketNewConnectCommand(cmd, retsock);
}

805
#if WITH_SSH2
806 807 808 809 810 811 812 813 814 815
int
virNetSocketNewConnectLibSSH2(const char *host,
                              const char *port,
                              const char *username,
                              const char *privkey,
                              const char *knownHosts,
                              const char *knownHostsVerify,
                              const char *authMethods,
                              const char *command,
                              virConnectAuthPtr auth,
816
                              virURIPtr uri,
817 818 819 820 821 822 823 824 825 826 827 828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859 860
                              virNetSocketPtr *retsock)
{
    virNetSocketPtr sock = NULL;
    virNetSSHSessionPtr sess = NULL;
    unsigned int verify;
    int ret = -1;
    int portN;

    char *authMethodNext = NULL;
    char *authMethodsCopy = NULL;
    char *authMethod;

    /* port number will be verified while opening the socket */
    if (virStrToLong_i(port, NULL, 10, &portN) < 0) {
        virReportError(VIR_ERR_SSH, "%s",
                       _("Failed to parse port number"));
        goto error;
    }

    /* create ssh session context */
    if (!(sess = virNetSSHSessionNew()))
        goto error;

    /* set ssh session parameters */
    if (virNetSSHSessionAuthSetCallback(sess, auth) != 0)
        goto error;

    if (STRCASEEQ("auto", knownHostsVerify))
        verify = VIR_NET_SSH_HOSTKEY_VERIFY_AUTO_ADD;
    else if (STRCASEEQ("ignore", knownHostsVerify))
        verify = VIR_NET_SSH_HOSTKEY_VERIFY_IGNORE;
    else if (STRCASEEQ("normal", knownHostsVerify))
        verify = VIR_NET_SSH_HOSTKEY_VERIFY_NORMAL;
    else {
        virReportError(VIR_ERR_INVALID_ARG,
                       _("Invalid host key verification method: '%s'"),
                       knownHostsVerify);
        goto error;
    }

    if (virNetSSHSessionSetHostKeyVerification(sess,
                                               host,
                                               portN,
                                               knownHosts,
861 862
                                               verify,
                                               VIR_NET_SSH_HOSTKEY_FILE_CREATE) != 0)
863 864 865 866 867
        goto error;

    if (virNetSSHSessionSetChannelCommand(sess, command) != 0)
        goto error;

868
    if (VIR_STRDUP(authMethodsCopy, authMethods) < 0)
869
        goto error;
870 871

    authMethodNext = authMethodsCopy;
872 873 874 875 876 877

    while ((authMethod = strsep(&authMethodNext, ","))) {
        if (STRCASEEQ(authMethod, "keyboard-interactive"))
            ret = virNetSSHSessionAuthAddKeyboardAuth(sess, username, -1);
        else if (STRCASEEQ(authMethod, "password"))
            ret = virNetSSHSessionAuthAddPasswordAuth(sess,
878 879
                                                      uri,
                                                      username);
880 881 882 883 884 885 886 887 888 889 890 891 892 893 894 895 896 897 898 899 900 901 902 903 904 905 906 907 908 909 910 911 912
        else if (STRCASEEQ(authMethod, "privkey"))
            ret = virNetSSHSessionAuthAddPrivKeyAuth(sess,
                                                     username,
                                                     privkey,
                                                     NULL);
        else if (STRCASEEQ(authMethod, "agent"))
            ret = virNetSSHSessionAuthAddAgentAuth(sess, username);
        else {
            virReportError(VIR_ERR_INVALID_ARG,
                           _("Invalid authentication method: '%s'"),
                           authMethod);
            ret = -1;
            goto error;
        }

        if (ret != 0)
            goto error;
    }

    /* connect to remote server */
    if ((ret = virNetSocketNewConnectTCP(host, port, &sock)) < 0)
        goto error;

    /* connect to the host using ssh */
    if ((ret = virNetSSHSessionConnect(sess, virNetSocketGetFD(sock))) != 0)
        goto error;

    sock->sshSession = sess;
    *retsock = sock;

    VIR_FREE(authMethodsCopy);
    return 0;

913
 error:
914 915 916 917 918 919 920 921 922 923 924 925 926 927 928 929
    virObjectUnref(sock);
    virObjectUnref(sess);
    VIR_FREE(authMethodsCopy);
    return ret;
}
#else
/*
 * Fallback used when libssh2 support is compiled out: always reports
 * ENOSYS and returns -1.
 */
int
virNetSocketNewConnectLibSSH2(const char *host ATTRIBUTE_UNUSED,
                              const char *port ATTRIBUTE_UNUSED,
                              const char *username ATTRIBUTE_UNUSED,
                              const char *privkey ATTRIBUTE_UNUSED,
                              const char *knownHosts ATTRIBUTE_UNUSED,
                              const char *knownHostsVerify ATTRIBUTE_UNUSED,
                              const char *authMethods ATTRIBUTE_UNUSED,
                              const char *command ATTRIBUTE_UNUSED,
                              virConnectAuthPtr auth ATTRIBUTE_UNUSED,
                              virURIPtr uri ATTRIBUTE_UNUSED,
                              virNetSocketPtr *retsock ATTRIBUTE_UNUSED)
{
    virReportSystemError(ENOSYS, "%s",
                         _("libssh2 transport support was not enabled"));
    return -1;
}
937
#endif /* WITH_SSH2 */
938 939 940 941 942 943 944 945 946 947 948 949 950 951 952 953

/*
 * Build a command from @cmdargv, let it inherit the common environment
 * and clear its capabilities, then pass it to
 * virNetSocketNewConnectCommand() whose result is returned unchanged.
 *
 * @retsock is reset to NULL before any other work is done.
 */
int virNetSocketNewConnectExternal(const char **cmdargv,
                                   virNetSocketPtr *retsock)
{
    virCommandPtr extcmd;

    *retsock = NULL;

    extcmd = virCommandNewArgs(cmdargv);
    virCommandAddEnvPassCommon(extcmd);
    virCommandClearCaps(extcmd);

    return virNetSocketNewConnectCommand(extcmd, retsock);
}


954 955 956 957 958 959 960 961 962 963 964 965 966 967 968 969 970 971
/*
 * Wrap the already-open descriptor @sockfd in a new client socket
 * object stored in @retsock.  Only the local address is looked up; no
 * remote address is passed to virNetSocketNew().
 *
 * Returns 0 on success, -1 if getsockname() or virNetSocketNew() fails.
 */
int virNetSocketNewConnectSockFD(int sockfd,
                                 virNetSocketPtr *retsock)
{
    virSocketAddr localAddr;

    /* Start from an all-zero address, as virNetSocketAccept() does:
     * getsockname() only writes the bytes it accounts for in .len, and
     * the remainder of the struct would otherwise stay indeterminate. */
    memset(&localAddr, 0, sizeof(localAddr));

    localAddr.len = sizeof(localAddr.data);
    if (getsockname(sockfd, &localAddr.data.sa, &localAddr.len) < 0) {
        virReportSystemError(errno, "%s", _("Unable to get local socket name"));
        return -1;
    }

    if (!(*retsock = virNetSocketNew(&localAddr, NULL, true, sockfd, -1, -1)))
        return -1;

    return 0;
}


972 973 974 975 976 977 978 979 980 981 982 983 984 985 986 987 988 989 990 991 992 993 994 995 996 997 998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 1024 1025
/*
 * Rebuild a socket object from the JSON document @object, which must
 * carry the "fd", "pid", "errfd" and "isClient" members.
 *
 * Returns the new socket, or NULL if a member is missing or an address
 * lookup on the descriptor fails.
 */
virNetSocketPtr virNetSocketNewPostExecRestart(virJSONValuePtr object)
{
    virSocketAddr local;
    virSocketAddr remote;
    int sockfd;
    int childpid;
    int stderrfd;
    bool client;

    if (virJSONValueObjectGetNumberInt(object, "fd", &sockfd) < 0) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("Missing fd data in JSON document"));
        return NULL;
    }

    if (virJSONValueObjectGetNumberInt(object, "pid", &childpid) < 0) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("Missing pid data in JSON document"));
        return NULL;
    }

    if (virJSONValueObjectGetNumberInt(object, "errfd", &stderrfd) < 0) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("Missing errfd data in JSON document"));
        return NULL;
    }

    if (virJSONValueObjectGetBoolean(object, "isClient", &client) < 0) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("Missing isClient data in JSON document"));
        return NULL;
    }

    /* NOTE(review): the remote address is obtained with getsockname(),
     * the same call used for the local address below, even though the
     * error text talks about the peer name.  Confirm whether
     * getpeername() was intended; it would fail on a socket that is not
     * connected, so this is left as found. */
    memset(&remote, 0, sizeof(remote));
    remote.len = sizeof(remote.data.stor);
    if (getsockname(sockfd, &remote.data.sa, &remote.len) < 0) {
        virReportSystemError(errno, "%s", _("Unable to get peer socket name"));
        return NULL;
    }

    memset(&local, 0, sizeof(local));
    local.len = sizeof(local.data.stor);
    if (getsockname(sockfd, &local.data.sa, &local.len) < 0) {
        virReportSystemError(errno, "%s", _("Unable to get local socket name"));
        return NULL;
    }

    return virNetSocketNew(&local, &remote,
                           client, sockfd, stderrfd, childpid);
}


/*
 * Serialise @sock into a JSON object with the members "fd", "errfd",
 * "pid" and "isClient", and mark the descriptors inheritable.
 *
 * Refused while a SASL or TLS session is attached.  Returns the JSON
 * object, or NULL on any failure.
 */
virJSONValuePtr virNetSocketPreExecRestart(virNetSocketPtr sock)
{
    virJSONValuePtr state = NULL;
    virJSONValuePtr ret = NULL;

    virObjectLock(sock);

#if WITH_SASL
    if (sock->saslSession) {
        virReportError(VIR_ERR_OPERATION_INVALID, "%s",
                       _("Unable to save socket state when SASL session is active"));
        goto cleanup;
    }
#endif
#if WITH_GNUTLS
    if (sock->tlsSession) {
        virReportError(VIR_ERR_OPERATION_INVALID, "%s",
                       _("Unable to save socket state when TLS session is active"));
        goto cleanup;
    }
#endif

    if (!(state = virJSONValueNewObject()))
        goto cleanup;

    if (virJSONValueObjectAppendNumberInt(state, "fd", sock->fd) < 0 ||
        virJSONValueObjectAppendNumberInt(state, "errfd", sock->errfd) < 0 ||
        virJSONValueObjectAppendNumberInt(state, "pid", sock->pid) < 0 ||
        virJSONValueObjectAppendBoolean(state, "isClient", sock->client) < 0)
        goto cleanup;

    if (virSetInherit(sock->fd, true) < 0) {
        virReportSystemError(errno,
                             _("Cannot disable close-on-exec flag on socket %d"),
                             sock->fd);
        goto cleanup;
    }

    /* The error pipe is optional; -1 means there is none */
    if (sock->errfd != -1 &&
        virSetInherit(sock->errfd, true) < 0) {
        virReportSystemError(errno,
                             _("Cannot disable close-on-exec flag on pipe %d"),
                             sock->errfd);
        goto cleanup;
    }

    /* Success: hand the object to the caller, nothing left to free */
    ret = state;
    state = NULL;

 cleanup:
    virObjectUnlock(sock);
    virJSONValueFree(state);
    return ret;
}


1082
void virNetSocketDispose(void *obj)
1083
{
1084
    virNetSocketPtr sock = obj;
1085

1086 1087 1088
    PROBE(RPC_SOCKET_DISPOSE,
          "sock=%p", sock);

1089 1090 1091 1092 1093 1094 1095 1096 1097 1098 1099 1100 1101
    if (sock->watch > 0) {
        virEventRemoveHandle(sock->watch);
        sock->watch = -1;
    }

#ifdef HAVE_SYS_UN_H
    /* If a server socket, then unlink UNIX path */
    if (!sock->client &&
        sock->localAddr.data.sa.sa_family == AF_UNIX &&
        sock->localAddr.data.un.sun_path[0] != '\0')
        unlink(sock->localAddr.data.un.sun_path);
#endif

1102
#if WITH_GNUTLS
1103 1104 1105
    /* Make sure it can't send any more I/O during shutdown */
    if (sock->tlsSession)
        virNetTLSSessionSetIOCallbacks(sock->tlsSession, NULL, NULL, NULL);
1106
    virObjectUnref(sock->tlsSession);
1107
#endif
1108
#if WITH_SASL
1109
    virObjectUnref(sock->saslSession);
1110 1111
#endif

1112
#if WITH_SSH2
1113 1114 1115
    virObjectUnref(sock->sshSession);
#endif

1116 1117 1118
    VIR_FORCE_CLOSE(sock->fd);
    VIR_FORCE_CLOSE(sock->errfd);

1119
    virProcessAbort(sock->pid);
1120 1121 1122 1123 1124 1125 1126 1127

    VIR_FREE(sock->localAddrStr);
    VIR_FREE(sock->remoteAddrStr);
}


/* Return the file descriptor of @sock, read while holding its lock. */
int virNetSocketGetFD(virNetSocketPtr sock)
{
    int sockfd;

    virObjectLock(sock);
    sockfd = sock->fd;
    virObjectUnlock(sock);

    return sockfd;
}


1136 1137 1138 1139 1140
/*
 * Duplicate the file descriptor of @sock.  With @cloexec set the copy
 * is made through fcntl(F_DUPFD_CLOEXEC), otherwise through dup().
 *
 * Returns the new descriptor, or -1 with an error reported.
 */
int virNetSocketDupFD(virNetSocketPtr sock, bool cloexec)
{
    int copy = cloexec ? fcntl(sock->fd, F_DUPFD_CLOEXEC, 0)
                       : dup(sock->fd);

    if (copy >= 0)
        return copy;

    virReportSystemError(errno, "%s",
                         _("Unable to copy socket file handle"));
    return -1;
}


1153 1154
/* Report whether the local address of @sock belongs to the AF_UNIX family. */
bool virNetSocketIsLocal(virNetSocketPtr sock)
{
    bool local;

    virObjectLock(sock);
    local = (sock->localAddr.data.sa.sa_family == AF_UNIX);
    virObjectUnlock(sock);

    return local;
}


1164 1165 1166
/*
 * Report whether file descriptors can be passed over @sock, which this
 * function equates with the local address being of the AF_UNIX family.
 */
bool virNetSocketHasPassFD(virNetSocketPtr sock)
{
    bool canPass;

    virObjectLock(sock);
    canPass = (sock->localAddr.data.sa.sa_family == AF_UNIX);
    virObjectUnlock(sock);

    return canPass;
}


1175 1176
/*
 * Return whatever virSocketAddrGetPort() yields for the local address
 * of @sock; the lookup is done under the socket lock.
 */
int virNetSocketGetPort(virNetSocketPtr sock)
{
    int localPort;

    virObjectLock(sock);
    localPort = virSocketAddrGetPort(&sock->localAddr);
    virObjectUnlock(sock);

    return localPort;
}


1185
#if defined(SO_PEERCRED)
1186 1187 1188
/*
 * SO_PEERCRED flavour: query the peer credentials of @sock and store
 * them in @uid, @gid and @pid; @timestamp is filled in by
 * virProcessGetStartTime() for the peer's PID.
 *
 * Returns 0 on success, -1 on failure.  The output credentials are only
 * written once both lookups have succeeded.
 */
int virNetSocketGetUNIXIdentity(virNetSocketPtr sock,
                                uid_t *uid,
                                gid_t *gid,
                                pid_t *pid,
                                unsigned long long *timestamp)
{
    struct ucred peer;
    socklen_t peerlen = sizeof(peer);
    int rc = -1;

    virObjectLock(sock);

    if (getsockopt(sock->fd, SOL_SOCKET, SO_PEERCRED, &peer, &peerlen) < 0) {
        virReportSystemError(errno, "%s",
                             _("Failed to get client socket identity"));
    } else if (virProcessGetStartTime(peer.pid, timestamp) >= 0) {
        *pid = peer.pid;
        *uid = peer.uid;
        *gid = peer.gid;
        rc = 0;
    }

    virObjectUnlock(sock);
    return rc;
}
1217
#elif defined(LOCAL_PEERCRED)
1218

1219 1220 1221
/* VIR_SOL_PEERCRED - the value needed to let getsockopt() work with
 * LOCAL_PEERCRED
 *
 * Mac OS X 10.8 provides SOL_LOCAL for LOCAL_PEERCRED.
 *
 * On FreeBSD and Mac OS X prior to 10.7, SOL_LOCAL is not defined and
 * users are expected to supply 0 as the second value for getsockopt()
 * when using LOCAL_PEERCRED. NB SOL_SOCKET cannot be used instead
 * of SOL_LOCAL
 */
# if defined(SOL_LOCAL)
#  define VIR_SOL_PEERCRED SOL_LOCAL
# else
#  define VIR_SOL_PEERCRED 0
# endif

1235 1236 1237
/*
 * LOCAL_PEERCRED flavour: query the peer's struct xucred and store its
 * user and group ID in @uid and @gid.  @pid and @timestamp are set to
 * -1, except that @pid is filled in through LOCAL_PEERPID where that
 * option is defined and the lookup works.
 *
 * Returns 0 on success, -1 on failure.
 */
int virNetSocketGetUNIXIdentity(virNetSocketPtr sock,
                                uid_t *uid,
                                gid_t *gid,
                                pid_t *pid,
                                unsigned long long *timestamp)
{
    struct xucred peer;
    socklen_t optlen = sizeof(peer);
    int rc = -1;

    virObjectLock(sock);

    /* Preset to an invalid count so the range check below can tell
     * whether getsockopt() stored a usable value */
    peer.cr_ngroups = -1;
    if (getsockopt(sock->fd, VIR_SOL_PEERCRED, LOCAL_PEERCRED, &peer, &optlen) < 0) {
        virReportSystemError(errno, "%s",
                             _("Failed to get client socket identity"));
        goto cleanup;
    }

    if (peer.cr_version != XUCRED_VERSION) {
        virReportError(VIR_ERR_SYSTEM_ERROR, "%s",
                       _("Failed to get valid client socket identity"));
        goto cleanup;
    }

    if (peer.cr_ngroups <= 0 || peer.cr_ngroups > NGROUPS) {
        virReportError(VIR_ERR_SYSTEM_ERROR, "%s",
                       _("Failed to get valid client socket identity groups"));
        goto cleanup;
    }

    /* PID and process creation time are not supported on BSDs by
     * LOCAL_PEERCRED.
     */
    *pid = -1;
    *timestamp = -1;
    *uid = peer.cr_uid;
    *gid = peer.cr_gid;

# ifdef LOCAL_PEERPID
    /* Exists on Mac OS X 10.8 for retrieving the peer's PID */
    optlen = sizeof(*pid);

    if (getsockopt(sock->fd, VIR_SOL_PEERCRED, LOCAL_PEERPID, pid, &optlen) < 0) {
        /* Ensure this is set to something sane as there are no guarantees
         * as to what it is set to now.
         */
        *pid = -1;

        /* If this was built on a system with LOCAL_PEERPID defined but
         * the kernel doesn't support it we'll get back EOPNOTSUPP so
         * treat all errors but EOPNOTSUPP as fatal
         */
        if (errno != EOPNOTSUPP) {
            virReportSystemError(errno, "%s",
                    _("Failed to get client socket PID"));
            goto cleanup;
        }
    }
# endif

    rc = 0;

 cleanup:
    virObjectUnlock(sock);
    return rc;
}
1302
#else
1303 1304 1305
/*
 * Fallback for platforms with neither SO_PEERCRED nor LOCAL_PEERCRED:
 * all arguments are ignored, ENOSYS is reported and -1 is returned.
 */
int virNetSocketGetUNIXIdentity(virNetSocketPtr sock ATTRIBUTE_UNUSED,
                                uid_t *uid ATTRIBUTE_UNUSED,
                                gid_t *gid ATTRIBUTE_UNUSED,
                                pid_t *pid ATTRIBUTE_UNUSED,
                                unsigned long long *timestamp ATTRIBUTE_UNUSED)
{
    /* XXX Many more OS support UNIX socket credentials we could port to. See dbus ....*/
    virReportSystemError(ENOSYS, "%s",
                         _("Client socket identity not available"));
    return -1;
}
#endif

1316
#ifdef WITH_SELINUX
1317 1318
/*
 * Store a copy of the peer's SELinux context in @context.
 *
 * @context is left NULL, and 0 is still returned, when getpeercon()
 * fails with ENOSYS or ENOPROTOOPT.  Returns 0 on success and -1 on any
 * other failure.
 */
int virNetSocketGetSELinuxContext(virNetSocketPtr sock,
                                  char **context)
{
    security_context_t peercon = NULL;
    int rc = -1;

    *context = NULL;

    virObjectLock(sock);

    if (getpeercon(sock->fd, &peercon) < 0) {
        if (errno == ENOSYS || errno == ENOPROTOOPT)
            rc = 0;
        else
            virReportSystemError(errno, "%s",
                                 _("Unable to query peer security context"));
        goto cleanup;
    }

    if (VIR_STRDUP(*context, peercon) >= 0)
        rc = 0;

 cleanup:
    freecon(peercon);
    virObjectUnlock(sock);
    return rc;
}
#else
1346 1347
/*
 * Fallback for builds without WITH_SELINUX: @context is set to NULL and
 * 0 is returned.
 */
int virNetSocketGetSELinuxContext(virNetSocketPtr sock ATTRIBUTE_UNUSED,
                                  char **context)
{
    *context = NULL;

    return 0;
}
#endif

1354 1355 1356 1357

/*
 * Apply virSetBlocking() with @blocking to the descriptor of @sock
 * while holding the socket lock, and return its result.
 */
int virNetSocketSetBlocking(virNetSocketPtr sock,
                            bool blocking)
{
    int rc;

    virObjectLock(sock);
    rc = virSetBlocking(sock->fd, blocking);
    virObjectUnlock(sock);

    return rc;
}


/* Return the stored local address string of @sock; no lock is taken. */
const char *virNetSocketLocalAddrString(virNetSocketPtr sock)
{
    const char *addr = sock->localAddrStr;

    return addr;
}

/* Return the stored remote address string of @sock; no lock is taken. */
const char *virNetSocketRemoteAddrString(virNetSocketPtr sock)
{
    const char *addr = sock->remoteAddrStr;

    return addr;
}

1376

1377
#if WITH_GNUTLS
1378 1379 1380 1381 1382 1383 1384 1385 1386 1387 1388 1389 1390 1391 1392 1393 1394 1395 1396 1397 1398
/*
 * Write callback registered with the TLS session: @opaque is the socket
 * object, and @len bytes of @buf are written straight to its descriptor.
 */
static ssize_t virNetSocketTLSSessionWrite(const char *buf,
                                           size_t len,
                                           void *opaque)
{
    virNetSocketPtr owner = opaque;

    return write(owner->fd, buf, len);
}


/*
 * Read callback registered with the TLS session: @opaque is the socket
 * object, and up to @len bytes are read from its descriptor into @buf.
 */
static ssize_t virNetSocketTLSSessionRead(char *buf,
                                          size_t len,
                                          void *opaque)
{
    virNetSocketPtr owner = opaque;

    return read(owner->fd, buf, len);
}


/*
 * Attach the TLS session @sess to @sock: the reference to any previous
 * session is dropped, a new reference to @sess is stored, and the
 * session's I/O callbacks are pointed at this socket.
 */
void virNetSocketSetTLSSession(virNetSocketPtr sock,
                               virNetTLSSessionPtr sess)
{
    virObjectLock(sock);

    virObjectUnref(sock->tlsSession);
    sock->tlsSession = virObjectRef(sess);

    virNetTLSSessionSetIOCallbacks(sess,
                                   virNetSocketTLSSessionWrite,
                                   virNetSocketTLSSessionRead,
                                   sock);

    virObjectUnlock(sock);
}
1408
#endif
1409

1410
#if WITH_SASL
1411 1412 1413
/*
 * Attach the SASL session @sess to @sock: the reference to any previous
 * session is dropped and a new reference to @sess is stored.
 */
void virNetSocketSetSASLSession(virNetSocketPtr sock,
                                virNetSASLSessionPtr sess)
{
    virObjectLock(sock);

    virObjectUnref(sock->saslSession);
    sock->saslSession = virObjectRef(sess);

    virObjectUnlock(sock);
}
#endif


/*
 * Report whether data is already buffered for @sock: either the SSH
 * session says so (WITH_SSH2) or a decoded SASL buffer is present
 * (WITH_SASL).  Always false when neither feature is compiled in.
 */
bool virNetSocketHasCachedData(virNetSocketPtr sock ATTRIBUTE_UNUSED)
{
    bool cached = false;

    virObjectLock(sock);

#if WITH_SSH2
    if (virNetSSHSessionHasCachedData(sock->sshSession))
        cached = true;
#endif

#if WITH_SASL
    if (sock->saslDecoded)
        cached = true;
#endif

    virObjectUnlock(sock);

    return cached;
}

1440
#if WITH_SSH2
1441 1442 1443 1444 1445 1446 1447 1448 1449 1450 1451 1452 1453 1454
/* Read up to @len bytes into @buf through the SSH session of @sock. */
static ssize_t virNetSocketLibSSH2Read(virNetSocketPtr sock,
                                       char *buf,
                                       size_t len)
{
    ssize_t got = virNetSSHChannelRead(sock->sshSession, buf, len);

    return got;
}

/* Write @len bytes of @buf through the SSH session of @sock. */
static ssize_t virNetSocketLibSSH2Write(virNetSocketPtr sock,
                                        const char *buf,
                                        size_t len)
{
    ssize_t sent = virNetSSHChannelWrite(sock->sshSession, buf, len);

    return sent;
}
#endif
1455

1456 1457 1458
/*
 * Report whether @sock still holds an encoded SASL buffer (WITH_SASL).
 * Always false when SASL is not compiled in.
 */
bool virNetSocketHasPendingData(virNetSocketPtr sock ATTRIBUTE_UNUSED)
{
    bool pending = false;

    virObjectLock(sock);

#if WITH_SASL
    if (sock->saslEncoded)
        pending = true;
#endif

    virObjectUnlock(sock);

    return pending;
}


1469
/*
 * Read up to @len bytes from the transport of @sock into @buf.
 *
 * With an SSH session the read is delegated to it.  Otherwise the data
 * comes from the TLS session once its handshake is complete, or from
 * the plain descriptor.  EINTR restarts the read.
 *
 * Returns the number of bytes read, 0 if the read would block (EAGAIN),
 * or -1 with an error reported.  End of file is reported as an EIO
 * error.  When the socket has an error pipe, up to 1024 bytes read from
 * it are appended to the error message.
 */
static ssize_t virNetSocketReadWire(virNetSocketPtr sock, char *buf, size_t len)
{
    char *errout = NULL;
    ssize_t ret;
    int saved_errno = 0;

#if WITH_SSH2
    if (sock->sshSession)
        return virNetSocketLibSSH2Read(sock, buf, len);
#endif

 reread:
#if WITH_GNUTLS
    if (sock->tlsSession &&
        virNetTLSSessionGetHandshakeStatus(sock->tlsSession) ==
        VIR_NET_TLS_HANDSHAKE_COMPLETE) {
        ret = virNetTLSSessionRead(sock->tlsSession, buf, len);
    } else {
#endif
        ret = read(sock->fd, buf, len);
#if WITH_GNUTLS
    }
#endif

    if (ret < 0) {
        /* Remember the cause of the failure now: reading the error pipe
         * below may overwrite errno before it gets reported. */
        saved_errno = errno;

        if (saved_errno == EINTR)
            goto reread;
        if (saved_errno == EAGAIN)
            return 0;
    }

    if (ret <= 0 &&
        sock->errfd != -1 &&
        virFileReadLimFD(sock->errfd, 1024, &errout) >= 0 &&
        errout != NULL) {
        size_t elen = strlen(errout);
        /* remove trailing whitespace */
        while (elen && c_isspace(errout[elen - 1]))
            errout[--elen] = '\0';
    }

    if (ret < 0) {
        if (errout)
            virReportSystemError(saved_errno,
                                 _("Cannot recv data: %s"), errout);
        else
            virReportSystemError(saved_errno, "%s",
                                 _("Cannot recv data"));
        ret = -1;
    } else if (ret == 0) {
        if (errout)
            virReportSystemError(EIO,
                                 _("End of file while reading data: %s"), errout);
        else
            virReportSystemError(EIO, "%s",
                                 _("End of file while reading data"));
        ret = -1;
    }

    VIR_FREE(errout);
    return ret;
}

1529
/*
 * Write @len bytes of @buf to the transport of @sock.
 *
 * With an SSH session the write is delegated to it.  Otherwise the data
 * goes through the TLS session once its handshake is complete, or to
 * the plain descriptor.  EINTR restarts the write.
 *
 * Returns the number of bytes written, 0 if the write would block
 * (EAGAIN), or -1 with an error reported.  A zero-length write result
 * is reported as an EIO error.
 */
static ssize_t virNetSocketWriteWire(virNetSocketPtr sock, const char *buf, size_t len)
{
    ssize_t sent;

#if WITH_SSH2
    if (sock->sshSession)
        return virNetSocketLibSSH2Write(sock, buf, len);
#endif

 rewrite:
#if WITH_GNUTLS
    if (sock->tlsSession &&
        virNetTLSSessionGetHandshakeStatus(sock->tlsSession) ==
        VIR_NET_TLS_HANDSHAKE_COMPLETE) {
        sent = virNetTLSSessionWrite(sock->tlsSession, buf, len);
    } else {
#endif
        sent = write(sock->fd, buf, len);
#if WITH_GNUTLS
    }
#endif

    if (sent > 0)
        return sent;

    if (sent == 0) {
        virReportSystemError(EIO, "%s",
                             _("End of file while writing data"));
        return -1;
    }

    /* sent < 0: decide between retry, would-block and a real error */
    if (errno == EINTR)
        goto rewrite;
    if (errno == EAGAIN)
        return 0;

    virReportSystemError(errno, "%s",
                         _("Cannot write data"));
    return -1;
}


1571
#if WITH_SASL
1572 1573 1574 1575 1576 1577 1578 1579
/*
 * Read decoded SASL data from @sock into @buf.
 *
 * When no decoded data is buffered, one chunk is read off the wire and
 * decoded into sock->saslDecoded.  Then at most @len bytes of the
 * buffered data are copied out, and the buffer is reset once it has
 * been consumed completely.
 *
 * Returns the number of bytes copied, or the wire read's result (0 or
 * -1) if that read yields nothing, or -1 if allocation or decoding fails.
 */
static ssize_t virNetSocketReadSASL(virNetSocketPtr sock, char *buf, size_t len)
{
    ssize_t avail;

    /* Need to read some more data off the wire */
    if (sock->saslDecoded == NULL) {
        ssize_t wireLen = virNetSASLSessionGetMaxBufSize(sock->saslSession);
        char *wire;
        bool decodeFailed;

        if (VIR_ALLOC_N(wire, wireLen) < 0)
            return -1;

        wireLen = virNetSocketReadWire(sock, wire, wireLen);
        if (wireLen <= 0) {
            VIR_FREE(wire);
            return wireLen;
        }

        decodeFailed = virNetSASLSessionDecode(sock->saslSession,
                                               wire, wireLen,
                                               &sock->saslDecoded,
                                               &sock->saslDecodedLength) < 0;
        /* The raw chunk is no longer needed whatever the outcome */
        VIR_FREE(wire);
        if (decodeFailed)
            return -1;

        sock->saslDecodedOffset = 0;
    }

    /* Some buffered decoded data to return now */
    avail = sock->saslDecodedLength - sock->saslDecodedOffset;

    if (len > avail)
        len = avail;

    memcpy(buf, sock->saslDecoded + sock->saslDecodedOffset, len);
    sock->saslDecodedOffset += len;

    if (sock->saslDecodedOffset == sock->saslDecodedLength) {
        sock->saslDecoded = NULL;
        sock->saslDecodedOffset = sock->saslDecodedLength = 0;
    }

    return len;
}


/*
 * Write @len bytes of @buf to @sock through the SASL session.
 *
 * At most virNetSASLSessionGetMaxBufSize() bytes of @buf are encoded
 * per call.  The encoded form is kept in sock->saslEncoded until it has
 * been written out completely, which may take several calls.
 *
 * Returns the number of raw bytes consumed once the whole encoded
 * buffer is on the wire, 0 if more calls are needed (including the
 * would-block case), or -1 on error.
 */
static ssize_t virNetSocketWriteSASL(virNetSocketPtr sock, const char *buf, size_t len)
{
    /* Same type as virNetSocketWriteWire() returns, so that its result
     * is not narrowed on the way through. */
    ssize_t ret;
    size_t tosend = virNetSASLSessionGetMaxBufSize(sock->saslSession);

    /* SASL doesn't necessarily let us send the whole
       buffer at once */
    if (tosend > len)
        tosend = len;

    /* Not got any pending encoded data, so we need to encode raw stuff */
    if (sock->saslEncoded == NULL) {
        if (virNetSASLSessionEncode(sock->saslSession,
                                    buf, tosend,
                                    &sock->saslEncoded,
                                    &sock->saslEncodedLength) < 0)
            return -1;

        sock->saslEncodedOffset = 0;
    }

    /* Send some of the encoded stuff out on the wire */
    ret = virNetSocketWriteWire(sock,
                                sock->saslEncoded + sock->saslEncodedOffset,
                                sock->saslEncodedLength - sock->saslEncodedOffset);

    if (ret <= 0)
        return ret; /* -1 error, 0 == EAGAIN */

    /* Note how much we sent */
    sock->saslEncodedOffset += ret;

    /* Sent all encoded, so update raw buffer to indicate completion */
    if (sock->saslEncodedOffset == sock->saslEncodedLength) {
        sock->saslEncoded = NULL;
        sock->saslEncodedOffset = sock->saslEncodedLength = 0;

        /* Mark as complete, so caller detects completion */
        return tosend;
    } else {
        /* Still have stuff pending in saslEncoded buffer.
         * Pretend to caller that we didn't send any yet.
         * The caller will then retry with same buffer
         * shortly, which lets us finish saslEncoded.
         */
        return 0;
    }
}
#endif

/*
 * Read up to @len bytes from @sock into @buf under the socket lock,
 * going through the SASL layer when a SASL session is attached and
 * straight to the wire otherwise.  Returns what the chosen reader
 * returns.
 */
ssize_t virNetSocketRead(virNetSocketPtr sock, char *buf, size_t len)
{
    ssize_t nread;

    virObjectLock(sock);

#if WITH_SASL
    if (sock->saslSession) {
        nread = virNetSocketReadSASL(sock, buf, len);
    } else
#endif
    {
        nread = virNetSocketReadWire(sock, buf, len);
    }

    virObjectUnlock(sock);

    return nread;
}

/*
 * Write @len bytes of @buf to @sock under the socket lock, going
 * through the SASL layer when a SASL session is attached and straight
 * to the wire otherwise.  Returns what the chosen writer returns.
 */
ssize_t virNetSocketWrite(virNetSocketPtr sock, const char *buf, size_t len)
{
    ssize_t nwritten;

    virObjectLock(sock);

#if WITH_SASL
    if (sock->saslSession) {
        nwritten = virNetSocketWriteSASL(sock, buf, len);
    } else
#endif
    {
        nwritten = virNetSocketWriteWire(sock, buf, len);
    }

    virObjectUnlock(sock);

    return nwritten;
}


1698 1699 1700
/*
 * Returns 1 if an FD was sent, 0 if it would block, -1 on error
 */
1701 1702 1703 1704
int virNetSocketSendFD(virNetSocketPtr sock, int fd)
{
    int ret = -1;
    if (!virNetSocketHasPassFD(sock)) {
1705
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
1706
                       _("Sending file descriptors is not supported on this socket"));
1707 1708
        return -1;
    }
1709
    virObjectLock(sock);
1710 1711 1712
    PROBE(RPC_SOCKET_SEND_FD,
          "sock=%p fd=%d", sock, fd);
    if (sendfd(sock->fd, fd) < 0) {
1713 1714 1715 1716 1717 1718
        if (errno == EAGAIN)
            ret = 0;
        else
            virReportSystemError(errno,
                                 _("Failed to send file descriptor %d"),
                                 fd);
1719 1720
        goto cleanup;
    }
1721
    ret = 1;
1722

1723
 cleanup:
1724
    virObjectUnlock(sock);
1725 1726 1727 1728
    return ret;
}


1729 1730 1731 1732
/*
 * Receive a file descriptor from the peer of @sock into @fd; the
 * descriptor is requested with O_CLOEXEC.  @fd is preset to -1.
 *
 * Returns 1 if an FD was read, 0 if it would block, -1 on error
 * (including sockets for which virNetSocketHasPassFD() is false).
 */
int virNetSocketRecvFD(virNetSocketPtr sock, int *fd)
{
    int rc = -1;

    *fd = -1;

    if (!virNetSocketHasPassFD(sock)) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("Receiving file descriptors is not supported on this socket"));
        return -1;
    }

    virObjectLock(sock);

    *fd = recvfd(sock->fd, O_CLOEXEC);
    if (*fd >= 0) {
        PROBE(RPC_SOCKET_RECV_FD,
              "sock=%p fd=%d", sock, *fd);
        rc = 1;
    } else if (errno == EAGAIN) {
        rc = 0;
    } else {
        virReportSystemError(errno, "%s",
                             _("Failed to recv file descriptor"));
    }

    virObjectUnlock(sock);
    return rc;
}


1763
/*
 * Put @sock into listening state.  A @backlog that is not positive is
 * replaced by 30.
 *
 * Returns 0 on success, -1 with an error reported otherwise.
 */
int virNetSocketListen(virNetSocketPtr sock, int backlog)
{
    int rc = 0;

    virObjectLock(sock);

    if (listen(sock->fd, backlog > 0 ? backlog : 30) < 0) {
        virReportSystemError(errno, "%s", _("Unable to listen on socket"));
        rc = -1;
    }

    virObjectUnlock(sock);
    return rc;
}

/*
 * Accept one pending connection on @sock and wrap it in a new socket
 * object stored in @clientsock.
 *
 * Returns 0 on success, and also when accept() fails with ECONNABORTED
 * or EAGAIN, in which case @clientsock stays NULL.  Returns -1 on any
 * other failure.  The accepted descriptor is closed again if no socket
 * object could be created for it.
 */
int virNetSocketAccept(virNetSocketPtr sock, virNetSocketPtr *clientsock)
{
    virSocketAddr local;
    virSocketAddr peer;
    int connfd = -1;
    int rc = -1;

    virObjectLock(sock);

    *clientsock = NULL;

    memset(&local, 0, sizeof(local));
    memset(&peer, 0, sizeof(peer));

    peer.len = sizeof(peer.data.stor);
    connfd = accept(sock->fd, &peer.data.sa, &peer.len);
    if (connfd < 0) {
        if (errno == ECONNABORTED || errno == EAGAIN)
            rc = 0;
        else
            virReportSystemError(errno, "%s",
                                 _("Unable to accept client"));
        goto cleanup;
    }

    local.len = sizeof(local.data);
    if (getsockname(connfd, &local.data.sa, &local.len) < 0) {
        virReportSystemError(errno, "%s", _("Unable to get local socket name"));
        goto cleanup;
    }

    *clientsock = virNetSocketNew(&local, &peer, true, connfd, -1, 0);
    if (!*clientsock)
        goto cleanup;

    /* The descriptor has been handed to virNetSocketNew(); reset it so
     * that the cleanup path does not close it */
    connfd = -1;
    rc = 0;

 cleanup:
    VIR_FORCE_CLOSE(connfd);
    virObjectUnlock(sock);
    return rc;
}


W
Wen Congyang 已提交
1824 1825
/*
 * Handler registered with the event loop for a socket watch.  @opaque
 * is the socket.  The user callback and its data are copied out under
 * the lock, and the callback is then invoked with the lock released.
 */
static void virNetSocketEventHandle(int watch ATTRIBUTE_UNUSED,
                                    int fd ATTRIBUTE_UNUSED,
                                    int events,
                                    void *opaque)
{
    virNetSocketPtr sock = opaque;
    virNetSocketIOFunc cb;
    void *cbdata;

    virObjectLock(sock);
    cb = sock->func;
    cbdata = sock->opaque;
    virObjectUnlock(sock);

    if (!cb)
        return;

    cb(sock, events, cbdata);
}

1842

1843 1844 1845 1846 1847 1848
static void virNetSocketEventFree(void *opaque)
{
    virNetSocketPtr sock = opaque;
    virFreeCallback ff;
    void *eopaque;

1849
    virObjectLock(sock);
1850 1851 1852 1853 1854
    ff = sock->ff;
    eopaque = sock->opaque;
    sock->func = NULL;
    sock->ff = NULL;
    sock->opaque = NULL;
1855
    virObjectUnlock(sock);
1856 1857 1858 1859

    if (ff)
        ff(eopaque);

1860
    virObjectUnref(sock);
1861 1862
}

1863 1864 1865
/*
 * Register @func to be called with @opaque for @events on @sock, with
 * @ff stored as the free function for @opaque.
 *
 * A reference to @sock is taken up front and dropped again if the
 * registration fails.  Returns 0 on success, -1 if a watch is already
 * registered or the event handle could not be added.
 */
int virNetSocketAddIOCallback(virNetSocketPtr sock,
                              int events,
                              virNetSocketIOFunc func,
                              void *opaque,
                              virFreeCallback ff)
{
    int rc = -1;

    virObjectRef(sock);
    virObjectLock(sock);

    if (sock->watch > 0) {
        VIR_DEBUG("Watch already registered on socket %p", sock);
        goto cleanup;
    }

    sock->watch = virEventAddHandle(sock->fd,
                                    events,
                                    virNetSocketEventHandle,
                                    sock,
                                    virNetSocketEventFree);
    if (sock->watch < 0) {
        VIR_DEBUG("Failed to register watch on socket %p", sock);
        goto cleanup;
    }

    sock->func = func;
    sock->opaque = opaque;
    sock->ff = ff;

    rc = 0;

 cleanup:
    virObjectUnlock(sock);
    if (rc != 0)
        virObjectUnref(sock);
    return rc;
}

/*
 * Change the event mask of the watch registered on @sock to @events.
 * Only a debug message is logged when no watch is registered.
 */
void virNetSocketUpdateIOCallback(virNetSocketPtr sock,
                                  int events)
{
    virObjectLock(sock);

    if (sock->watch > 0)
        virEventUpdateHandle(sock->watch, events);
    else
        VIR_DEBUG("Watch not registered on socket %p", sock);

    virObjectUnlock(sock);
}

/*
 * Remove the event watch registered on @sock.  Only a debug message is
 * logged when no watch is registered.
 *
 * The reference taken by virNetSocketAddIOCallback() is not dropped
 * here; virNetSocketEventFree(), registered alongside the watch, does
 * that.
 */
void virNetSocketRemoveIOCallback(virNetSocketPtr sock)
{
    virObjectLock(sock);

    if (sock->watch <= 0) {
        VIR_DEBUG("Watch not registered on socket %p", sock);
        virObjectUnlock(sock);
        return;
    }

    virEventRemoveHandle(sock->watch);

    /* Forget the watch now that it has been removed.  Otherwise
     * virNetSocketAddIOCallback() would refuse to register a new one
     * ("already registered") and virNetSocketDispose() would remove
     * the same handle a second time. */
    sock->watch = -1;

    virObjectUnlock(sock);
}
1928 1929 1930 1931 1932 1933

/*
 * Close the descriptor of @sock; a NULL @sock is ignored.
 *
 * For a server socket bound to a non-empty UNIX path the path is
 * unlinked too, and on success the stored path is emptied.
 */
void virNetSocketClose(virNetSocketPtr sock)
{
    if (sock == NULL)
        return;

    virObjectLock(sock);

    VIR_FORCE_CLOSE(sock->fd);

#ifdef HAVE_SYS_UN_H
    /* If a server socket, then unlink UNIX path */
    if (!sock->client &&
        sock->localAddr.data.sa.sa_family == AF_UNIX &&
        sock->localAddr.data.un.sun_path[0] != '\0' &&
        unlink(sock->localAddr.data.un.sun_path) == 0)
        sock->localAddr.data.un.sun_path[0] = '\0';
#endif

    virObjectUnlock(sock);
}