lxc_driver.c 69.5 KB
Newer Older
D
Daniel Veillard 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25
/*
 * Copyright IBM Corp. 2008
 *
 * lxc_driver.c: linux container driver functions
 *
 * Authors:
 *  David L. Leskovec <dlesko at linux.vnet.ibm.com>
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
 */

#include <config.h>

26
#include <fcntl.h>
D
Daniel Veillard 已提交
27 28
#include <sched.h>
#include <sys/utsname.h>
D
David L. Leskovec 已提交
29
#include <stdbool.h>
D
Daniel Veillard 已提交
30 31
#include <string.h>
#include <sys/types.h>
32 33 34
#include <sys/socket.h>
#include <sys/un.h>
#include <sys/poll.h>
D
Daniel Veillard 已提交
35 36 37
#include <unistd.h>
#include <wait.h>

38
#include "virterror_internal.h"
39
#include "logging.h"
40
#include "datatypes.h"
D
Daniel Veillard 已提交
41
#include "lxc_conf.h"
42
#include "lxc_container.h"
D
Daniel Veillard 已提交
43
#include "lxc_driver.h"
44
#include "memory.h"
45
#include "util.h"
46 47
#include "bridge.h"
#include "veth.h"
48
#include "event.h"
49
#include "nodeinfo.h"
50
#include "uuid.h"
51
#include "stats_linux.h"
52

D
Daniel Veillard 已提交
53

54 55
#define VIR_FROM_THIS VIR_FROM_LXC

56 57 58 59 60 61 62 63
typedef struct _lxcDomainObjPrivate lxcDomainObjPrivate;
typedef lxcDomainObjPrivate *lxcDomainObjPrivatePtr;
struct _lxcDomainObjPrivate {
    int monitor;
    int monitorWatch;
};


64
static int lxcStartup(int privileged);
65
static int lxcShutdown(void);
66
static lxc_driver_t *lxc_driver = NULL;
D
Daniel Veillard 已提交
67 68 69

/* Functions */

70 71
static void lxcDriverLock(lxc_driver_t *driver)
{
72
    virMutexLock(&driver->lock);
73 74 75
}
static void lxcDriverUnlock(lxc_driver_t *driver)
{
76
    virMutexUnlock(&driver->lock);
77 78
}

79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99
static void *lxcDomainObjPrivateAlloc(void)
{
    lxcDomainObjPrivatePtr priv;

    if (VIR_ALLOC(priv) < 0)
        return NULL;

    priv->monitor = -1;
    priv->monitorWatch = -1;

    return priv;
}

static void lxcDomainObjPrivateFree(void *data)
{
    lxcDomainObjPrivatePtr priv = data;

    VIR_FREE(priv);
}


100 101 102 103
static void lxcDomainEventFlush(int timer, void *opaque);
static void lxcDomainEventQueue(lxc_driver_t *driver,
                                virDomainEventPtr event);

104

D
Daniel Veillard 已提交
105 106 107 108 109
static virDrvOpenStatus lxcOpen(virConnectPtr conn,
                                virConnectAuthPtr auth ATTRIBUTE_UNUSED,
                                int flags ATTRIBUTE_UNUSED)
{
    /* Verify uri was specified */
110
    if (conn->uri == NULL) {
111 112
        if (lxc_driver == NULL)
            return VIR_DRV_OPEN_DECLINED;
113

114 115
        conn->uri = xmlParseURI("lxc:///");
        if (!conn->uri) {
116
            virReportOOMError();
117 118
            return VIR_DRV_OPEN_ERROR;
        }
119 120 121 122 123 124 125 126 127 128
    } else {
        if (conn->uri->scheme == NULL ||
            STRNEQ(conn->uri->scheme, "lxc"))
            return VIR_DRV_OPEN_DECLINED;

        /* Leave for remote driver */
        if (conn->uri->server != NULL)
            return VIR_DRV_OPEN_DECLINED;

        /* If path isn't '/' then they typoed, tell them correct path */
129 130
        if (conn->uri->path != NULL &&
            STRNEQ(conn->uri->path, "/")) {
131
            lxcError(VIR_ERR_INTERNAL_ERROR,
132
                     _("Unexpected LXC URI path '%s', try lxc:///"),
133 134 135
                     conn->uri->path);
            return VIR_DRV_OPEN_ERROR;
        }
D
Daniel Veillard 已提交
136

137 138
        /* URI was good, but driver isn't active */
        if (lxc_driver == NULL) {
139
            lxcError(VIR_ERR_INTERNAL_ERROR,
140
                     "%s", _("lxc state driver is not active"));
141 142 143
            return VIR_DRV_OPEN_ERROR;
        }
    }
144

145
    conn->privateData = lxc_driver;
D
Daniel Veillard 已提交
146 147 148 149 150 151

    return VIR_DRV_OPEN_SUCCESS;
}

static int lxcClose(virConnectPtr conn)
{
152 153 154 155 156 157
    lxc_driver_t *driver = conn->privateData;

    lxcDriverLock(driver);
    virDomainEventCallbackListRemoveConn(conn, driver->domainEventCallbacks);
    lxcDriverUnlock(driver);

158 159
    conn->privateData = NULL;
    return 0;
D
Daniel Veillard 已提交
160 161
}

162 163 164 165 166 167 168 169 170 171 172 173 174 175 176

static int lxcIsSecure(virConnectPtr conn ATTRIBUTE_UNUSED)
{
    /* Trivially secure, since always inside the daemon */
    return 1;
}


static int lxcIsEncrypted(virConnectPtr conn ATTRIBUTE_UNUSED)
{
    /* Not encrypted, but remote driver takes care of that */
    return 0;
}


177 178 179 180 181 182
static char *lxcGetCapabilities(virConnectPtr conn) {
    lxc_driver_t *driver = conn->privateData;
    char *xml;

    lxcDriverLock(driver);
    if ((xml = virCapabilitiesFormatXML(driver->caps)) == NULL)
183
        virReportOOMError();
184 185 186 187 188 189
    lxcDriverUnlock(driver);

    return xml;
}


D
Daniel Veillard 已提交
190 191 192
static virDomainPtr lxcDomainLookupByID(virConnectPtr conn,
                                        int id)
{
193 194 195
    lxc_driver_t *driver = conn->privateData;
    virDomainObjPtr vm;
    virDomainPtr dom = NULL;
D
Daniel Veillard 已提交
196

197
    lxcDriverLock(driver);
198
    vm = virDomainFindByID(&driver->domains, id);
199 200
    lxcDriverUnlock(driver);

D
Daniel Veillard 已提交
201
    if (!vm) {
202
        lxcError(VIR_ERR_NO_DOMAIN, NULL);
203
        goto cleanup;
D
Daniel Veillard 已提交
204 205 206
    }

    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
207
    if (dom)
D
Daniel Veillard 已提交
208 209
        dom->id = vm->def->id;

210
cleanup:
211 212
    if (vm)
        virDomainObjUnlock(vm);
D
Daniel Veillard 已提交
213 214 215 216 217 218
    return dom;
}

static virDomainPtr lxcDomainLookupByUUID(virConnectPtr conn,
                                          const unsigned char *uuid)
{
219 220 221
    lxc_driver_t *driver = conn->privateData;
    virDomainObjPtr vm;
    virDomainPtr dom = NULL;
D
Daniel Veillard 已提交
222

223
    lxcDriverLock(driver);
224
    vm = virDomainFindByUUID(&driver->domains, uuid);
225 226
    lxcDriverUnlock(driver);

D
Daniel Veillard 已提交
227
    if (!vm) {
228
        lxcError(VIR_ERR_NO_DOMAIN, NULL);
229
        goto cleanup;
D
Daniel Veillard 已提交
230 231 232
    }

    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
233
    if (dom)
D
Daniel Veillard 已提交
234 235
        dom->id = vm->def->id;

236
cleanup:
237 238
    if (vm)
        virDomainObjUnlock(vm);
D
Daniel Veillard 已提交
239 240 241 242 243 244
    return dom;
}

static virDomainPtr lxcDomainLookupByName(virConnectPtr conn,
                                          const char *name)
{
245 246 247
    lxc_driver_t *driver = conn->privateData;
    virDomainObjPtr vm;
    virDomainPtr dom = NULL;
D
Daniel Veillard 已提交
248

249
    lxcDriverLock(driver);
250
    vm = virDomainFindByName(&driver->domains, name);
251
    lxcDriverUnlock(driver);
D
Daniel Veillard 已提交
252
    if (!vm) {
253
        lxcError(VIR_ERR_NO_DOMAIN, NULL);
254
        goto cleanup;
D
Daniel Veillard 已提交
255 256 257
    }

    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
258
    if (dom)
D
Daniel Veillard 已提交
259 260
        dom->id = vm->def->id;

261
cleanup:
262 263
    if (vm)
        virDomainObjUnlock(vm);
D
Daniel Veillard 已提交
264 265 266
    return dom;
}

267 268 269 270 271 272 273 274 275 276 277

static int lxcDomainIsActive(virDomainPtr dom)
{
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr obj;
    int ret = -1;

    lxcDriverLock(driver);
    obj = virDomainFindByUUID(&driver->domains, dom->uuid);
    lxcDriverUnlock(driver);
    if (!obj) {
278
        lxcError(VIR_ERR_NO_DOMAIN, NULL);
279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299
        goto cleanup;
    }
    ret = virDomainObjIsActive(obj);

cleanup:
    if (obj)
        virDomainObjUnlock(obj);
    return ret;
}


static int lxcDomainIsPersistent(virDomainPtr dom)
{
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr obj;
    int ret = -1;

    lxcDriverLock(driver);
    obj = virDomainFindByUUID(&driver->domains, dom->uuid);
    lxcDriverUnlock(driver);
    if (!obj) {
300
        lxcError(VIR_ERR_NO_DOMAIN, NULL);
301 302 303 304 305 306 307 308 309 310 311
        goto cleanup;
    }
    ret = obj->persistent;

cleanup:
    if (obj)
        virDomainObjUnlock(obj);
    return ret;
}


312
static int lxcListDomains(virConnectPtr conn, int *ids, int nids) {
313
    lxc_driver_t *driver = conn->privateData;
314
    int n;
315

316
    lxcDriverLock(driver);
317
    n = virDomainObjListGetActiveIDs(&driver->domains, ids, nids);
318
    lxcDriverUnlock(driver);
319

320
    return n;
D
Daniel Veillard 已提交
321
}
322

323
static int lxcNumDomains(virConnectPtr conn) {
324
    lxc_driver_t *driver = conn->privateData;
325
    int n;
326

327
    lxcDriverLock(driver);
328
    n = virDomainObjListNumOfDomains(&driver->domains, 1);
329
    lxcDriverUnlock(driver);
330

331
    return n;
D
Daniel Veillard 已提交
332 333 334
}

static int lxcListDefinedDomains(virConnectPtr conn,
335
                                 char **const names, int nnames) {
336
    lxc_driver_t *driver = conn->privateData;
337
    int n;
338

339
    lxcDriverLock(driver);
340
    n = virDomainObjListGetInactiveNames(&driver->domains, names, nnames);
341
    lxcDriverUnlock(driver);
342

343
    return n;
D
Daniel Veillard 已提交
344 345 346
}


347
static int lxcNumDefinedDomains(virConnectPtr conn) {
348
    lxc_driver_t *driver = conn->privateData;
349
    int n;
350

351
    lxcDriverLock(driver);
352
    n = virDomainObjListNumOfDomains(&driver->domains, 0);
353
    lxcDriverUnlock(driver);
354

355
    return n;
D
Daniel Veillard 已提交
356 357
}

358 359


D
Daniel Veillard 已提交
360 361
static virDomainPtr lxcDomainDefine(virConnectPtr conn, const char *xml)
{
362 363
    lxc_driver_t *driver = conn->privateData;
    virDomainDefPtr def = NULL;
364
    virDomainObjPtr vm = NULL;
365
    virDomainPtr dom = NULL;
366
    virDomainEventPtr event = NULL;
367
    int dupVM;
D
Daniel Veillard 已提交
368

369
    lxcDriverLock(driver);
370
    if (!(def = virDomainDefParseString(driver->caps, xml,
371
                                        VIR_DOMAIN_XML_INACTIVE)))
372
        goto cleanup;
D
Daniel Veillard 已提交
373

374 375
   if ((dupVM = virDomainObjIsDuplicate(&driver->domains, def, 0)) < 0)
        goto cleanup;
376

377
    if ((def->nets != NULL) && !(driver->have_netns)) {
378
        lxcError(VIR_ERR_NO_SUPPORT,
J
Jim Meyering 已提交
379
                 "%s", _("System lacks NETNS support"));
380
        goto cleanup;
381 382
    }

383
    if (!(vm = virDomainAssignDef(driver->caps,
384
                                  &driver->domains, def, false)))
385 386
        goto cleanup;
    def = NULL;
387
    vm->persistent = 1;
D
Daniel Veillard 已提交
388

389
    if (virDomainSaveConfig(driver->configDir,
390
                            vm->newDef ? vm->newDef : vm->def) < 0) {
391
        virDomainRemoveInactive(&driver->domains, vm);
392
        vm = NULL;
393
        goto cleanup;
D
Daniel Veillard 已提交
394 395
    }

396 397
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_DEFINED,
398
                                     !dupVM ?
399 400 401
                                     VIR_DOMAIN_EVENT_DEFINED_ADDED :
                                     VIR_DOMAIN_EVENT_DEFINED_UPDATED);

D
Daniel Veillard 已提交
402
    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
403
    if (dom)
D
Daniel Veillard 已提交
404 405
        dom->id = vm->def->id;

406 407
cleanup:
    virDomainDefFree(def);
408 409
    if (vm)
        virDomainObjUnlock(vm);
410 411
    if (event)
        lxcDomainEventQueue(driver, event);
412
    lxcDriverUnlock(driver);
D
Daniel Veillard 已提交
413 414 415 416 417
    return dom;
}

static int lxcDomainUndefine(virDomainPtr dom)
{
418 419
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
420
    virDomainEventPtr event = NULL;
421
    int ret = -1;
D
Daniel Veillard 已提交
422

423
    lxcDriverLock(driver);
424
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
D
Daniel Veillard 已提交
425
    if (!vm) {
426
        lxcError(VIR_ERR_INVALID_DOMAIN,
427
                 "%s", _("No domain with matching uuid"));
428
        goto cleanup;
D
Daniel Veillard 已提交
429 430
    }

D
Daniel P. Berrange 已提交
431
    if (virDomainObjIsActive(vm)) {
432
        lxcError(VIR_ERR_OPERATION_INVALID,
433
                 "%s", _("Cannot delete active domain"));
434
        goto cleanup;
D
Daniel Veillard 已提交
435 436
    }

437
    if (!vm->persistent) {
438
        lxcError(VIR_ERR_OPERATION_INVALID,
439
                 "%s", _("Cannot undefine transient domain"));
440
        goto cleanup;
441
    }
D
Daniel Veillard 已提交
442

443
    if (virDomainDeleteConfig(driver->configDir,
444
                              driver->autostartDir,
445 446
                              vm) < 0)
        goto cleanup;
D
Daniel Veillard 已提交
447

448 449 450 451
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_UNDEFINED,
                                     VIR_DOMAIN_EVENT_UNDEFINED_REMOVED);

452
    virDomainRemoveInactive(&driver->domains, vm);
453
    vm = NULL;
454
    ret = 0;
D
Daniel Veillard 已提交
455

456
cleanup:
457 458
    if (vm)
        virDomainObjUnlock(vm);
459 460
    if (event)
        lxcDomainEventQueue(driver, event);
461
    lxcDriverUnlock(driver);
462
    return ret;
D
Daniel Veillard 已提交
463 464 465 466 467
}

static int lxcDomainGetInfo(virDomainPtr dom,
                            virDomainInfoPtr info)
{
468 469
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
470
    virCgroupPtr cgroup = NULL;
471
    int ret = -1;
D
Daniel Veillard 已提交
472

473
    lxcDriverLock(driver);
474
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
475

D
Daniel Veillard 已提交
476
    if (!vm) {
477
        lxcError(VIR_ERR_INVALID_DOMAIN,
478
                 "%s", _("No domain with matching uuid"));
479
        goto cleanup;
D
Daniel Veillard 已提交
480 481 482 483
    }

    info->state = vm->state;

D
Daniel P. Berrange 已提交
484
    if (!virDomainObjIsActive(vm) || driver->cgroup == NULL) {
D
Daniel Veillard 已提交
485
        info->cpuTime = 0;
R
Ryota Ozaki 已提交
486
        info->memory = vm->def->memory;
D
Daniel Veillard 已提交
487
    } else {
488
        if (virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) != 0) {
489
            lxcError(VIR_ERR_INTERNAL_ERROR,
490
                     _("Unable to get cgroup for %s"), vm->def->name);
491 492 493 494
            goto cleanup;
        }

        if (virCgroupGetCpuacctUsage(cgroup, &(info->cpuTime)) < 0) {
495
            lxcError(VIR_ERR_OPERATION_FAILED,
496
                     "%s", _("Cannot read cputime for domain"));
R
Ryota Ozaki 已提交
497 498 499
            goto cleanup;
        }
        if (virCgroupGetMemoryUsage(cgroup, &(info->memory)) < 0) {
500
            lxcError(VIR_ERR_OPERATION_FAILED,
501
                     "%s", _("Cannot read memory usage for domain"));
502 503
            goto cleanup;
        }
D
Daniel Veillard 已提交
504 505
    }

506
    info->maxMem = vm->def->maxmem;
D
Daniel Veillard 已提交
507
    info->nrVirtCpu = 1;
508
    ret = 0;
D
Daniel Veillard 已提交
509

510
cleanup:
511
    lxcDriverUnlock(driver);
512 513
    if (cgroup)
        virCgroupFree(&cgroup);
514 515
    if (vm)
        virDomainObjUnlock(vm);
516
    return ret;
D
Daniel Veillard 已提交
517 518
}

519
static char *lxcGetOSType(virDomainPtr dom)
D
Daniel Veillard 已提交
520
{
521 522 523
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    char *ret = NULL;
524

525
    lxcDriverLock(driver);
526
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
527 528
    lxcDriverUnlock(driver);

529
    if (!vm) {
530
        lxcError(VIR_ERR_INVALID_DOMAIN,
531
                 "%s", _("No domain with matching uuid"));
532
        goto cleanup;
533 534
    }

535 536
    ret = strdup(vm->def->os.type);

537
    if (ret == NULL)
538
        virReportOOMError();
539

540
cleanup:
541 542
    if (vm)
        virDomainObjUnlock(vm);
543
    return ret;
D
Daniel Veillard 已提交
544 545
}

R
Ryota Ozaki 已提交
546 547 548 549 550 551 552 553 554 555 556 557 558
/* Returns max memory in kb, 0 if error */
static unsigned long lxcDomainGetMaxMemory(virDomainPtr dom) {
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    unsigned long ret = 0;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    lxcDriverUnlock(driver);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
559
        lxcError(VIR_ERR_NO_DOMAIN,
560
                         _("No domain with matching uuid '%s'"), uuidstr);
R
Ryota Ozaki 已提交
561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583
        goto cleanup;
    }

    ret = vm->def->maxmem;

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    return ret;
}

static int lxcDomainSetMaxMemory(virDomainPtr dom, unsigned long newmax) {
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    lxcDriverUnlock(driver);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
584
        lxcError(VIR_ERR_NO_DOMAIN,
585
                         _("No domain with matching uuid '%s'"), uuidstr);
R
Ryota Ozaki 已提交
586 587 588 589
        goto cleanup;
    }

    if (newmax < vm->def->memory) {
590
        lxcError(VIR_ERR_INVALID_ARG,
591
                         "%s", _("Cannot set max memory lower than current memory"));
R
Ryota Ozaki 已提交
592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615
        goto cleanup;
    }

    vm->def->maxmem = newmax;
    ret = 0;

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    return ret;
}

static int lxcDomainSetMemory(virDomainPtr dom, unsigned long newmem) {
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    virCgroupPtr cgroup = NULL;
    int ret = -1;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    lxcDriverUnlock(driver);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
616
        lxcError(VIR_ERR_NO_DOMAIN,
617
                 _("No domain with matching uuid '%s'"), uuidstr);
R
Ryota Ozaki 已提交
618 619 620 621
        goto cleanup;
    }

    if (newmem > vm->def->maxmem) {
622
        lxcError(VIR_ERR_INVALID_ARG,
623
                 "%s", _("Cannot set memory higher than max memory"));
R
Ryota Ozaki 已提交
624 625 626
        goto cleanup;
    }

D
Daniel P. Berrange 已提交
627
    if (virDomainObjIsActive(vm)) {
628 629 630 631 632 633
        if (driver->cgroup == NULL) {
            lxcError(VIR_ERR_NO_SUPPORT,
                     "%s", _("cgroups must be configured on the host"));
            goto cleanup;
        }

R
Ryota Ozaki 已提交
634
        if (virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) != 0) {
635
            lxcError(VIR_ERR_INTERNAL_ERROR,
R
Ryota Ozaki 已提交
636 637 638 639 640
                     _("Unable to get cgroup for %s\n"), vm->def->name);
            goto cleanup;
        }

        if (virCgroupSetMemory(cgroup, newmem) < 0) {
641
            lxcError(VIR_ERR_OPERATION_FAILED,
642
                     "%s", _("Failed to set memory for domain"));
R
Ryota Ozaki 已提交
643 644 645 646 647 648 649 650 651 652 653 654 655 656 657
            goto cleanup;
        }
    } else {
        vm->def->memory = newmem;
    }
    ret = 0;

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    if (cgroup)
        virCgroupFree(&cgroup);
    return ret;
}

D
Daniel Veillard 已提交
658
static char *lxcDomainDumpXML(virDomainPtr dom,
659
                              int flags)
D
Daniel Veillard 已提交
660
{
661 662 663
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    char *ret = NULL;
D
Daniel Veillard 已提交
664

665
    lxcDriverLock(driver);
666
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
667 668
    lxcDriverUnlock(driver);

D
Daniel Veillard 已提交
669
    if (!vm) {
670
        lxcError(VIR_ERR_INVALID_DOMAIN,
671
                 "%s", _("No domain with matching uuid"));
672
        goto cleanup;
D
Daniel Veillard 已提交
673 674
    }

675
    ret = virDomainDefFormat((flags & VIR_DOMAIN_XML_INACTIVE) &&
676 677 678 679
                             vm->newDef ? vm->newDef : vm->def,
                             flags);

cleanup:
680 681
    if (vm)
        virDomainObjUnlock(vm);
682
    return ret;
D
Daniel Veillard 已提交
683 684
}

685 686 687

/**
 * lxcVmCleanup:
688 689 690
 * @conn: pointer to connection
 * @driver: pointer to driver structure
 * @vm: pointer to VM to clean up
691 692 693 694 695 696 697
 *
 * waitpid() on the container process.  kill and wait the tty process
 * This is called by both lxcDomainDestroy and lxcSigHandler when a
 * container exits.
 *
 * Returns 0 on success or -1 in case of error
 */
698
static int lxcVmCleanup(lxc_driver_t *driver,
699
                        virDomainObjPtr  vm)
700 701 702 703
{
    int rc = -1;
    int waitRc;
    int childStatus = -1;
D
Dan Smith 已提交
704
    virCgroupPtr cgroup;
705
    int i;
706
    lxcDomainObjPrivatePtr priv = vm->privateData;
707 708 709 710 711 712

    while (((waitRc = waitpid(vm->pid, &childStatus, 0)) == -1) &&
           errno == EINTR)
        ; /* empty */

    if ((waitRc != vm->pid) && (errno != ECHILD)) {
713
        virReportSystemError(errno,
714 715
                             _("waitpid failed to wait for container %d: %d"),
                             vm->pid, waitRc);
716 717 718 719 720 721 722 723 724
    }

    rc = 0;

    if (WIFEXITED(childStatus)) {
        rc = WEXITSTATUS(childStatus);
        DEBUG("container exited with rc: %d", rc);
    }

725 726
    virEventRemoveHandle(priv->monitorWatch);
    close(priv->monitor);
727 728

    virFileDeletePid(driver->stateDir, vm->def->name);
729
    virDomainDeleteConfig(driver->stateDir, NULL, vm);
730 731 732 733

    vm->state = VIR_DOMAIN_SHUTOFF;
    vm->pid = -1;
    vm->def->id = -1;
734 735
    priv->monitor = -1;
    priv->monitorWatch = -1;
736

737 738 739
    for (i = 0 ; i < vm->def->nnets ; i++) {
        vethInterfaceUpOrDown(vm->def->nets[i]->ifname, 0);
        vethDelete(vm->def->nets[i]->ifname);
740 741
    }

742 743
    if (driver->cgroup &&
        virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) == 0) {
D
Dan Smith 已提交
744 745 746 747
        virCgroupRemove(cgroup);
        virCgroupFree(&cgroup);
    }

748 749 750 751 752 753 754
    if (vm->newDef) {
        virDomainDefFree(vm->def);
        vm->def = vm->newDef;
        vm->def->id = -1;
        vm->newDef = NULL;
    }

755 756 757
    return rc;
}

758 759
/**
 * lxcSetupInterfaces:
760
 * @conn: pointer to connection
761
 * @def: pointer to virtual machine structure
762 763
 * @nveths: number of interfaces
 * @veths: interface names
764 765 766 767 768 769 770 771
 *
 * Sets up the container interfaces by creating the veth device pairs and
 * attaching the parent end to the appropriate bridge.  The container end
 * will moved into the container namespace later after clone has been called.
 *
 * Returns 0 on success or -1 in case of error
 */
static int lxcSetupInterfaces(virConnectPtr conn,
772
                              virDomainDefPtr def,
773 774
                              unsigned int *nveths,
                              char ***veths)
775
{
776
    int rc = -1, i;
777
    char *bridge = NULL;
778 779
    char parentVeth[PATH_MAX] = "";
    char containerVeth[PATH_MAX] = "";
780
    brControl *brctl = NULL;
781

782
    if (brInit(&brctl) != 0)
783 784
        return -1;

785 786
    for (i = 0 ; i < def->nnets ; i++) {
        switch (def->nets[i]->type) {
787 788 789
        case VIR_DOMAIN_NET_TYPE_NETWORK:
        {
            virNetworkPtr network = virNetworkLookupByName(conn,
790
                                                           def->nets[i]->data.network.name);
791 792 793 794 795 796 797
            if (!network) {
                goto error_exit;
            }

            bridge = virNetworkGetBridgeName(network);

            virNetworkFree(network);
798 799 800
            break;
        }
        case VIR_DOMAIN_NET_TYPE_BRIDGE:
801
            bridge = def->nets[i]->data.bridge.brname;
802
            break;
S
Stefan Berger 已提交
803 804 805 806 807 808 809 810 811 812

        case VIR_DOMAIN_NET_TYPE_USER:
        case VIR_DOMAIN_NET_TYPE_ETHERNET:
        case VIR_DOMAIN_NET_TYPE_SERVER:
        case VIR_DOMAIN_NET_TYPE_CLIENT:
        case VIR_DOMAIN_NET_TYPE_MCAST:
        case VIR_DOMAIN_NET_TYPE_INTERNAL:
        case VIR_DOMAIN_NET_TYPE_DIRECT:
        case VIR_DOMAIN_NET_TYPE_LAST:
            break;
813 814 815 816
        }

        DEBUG("bridge: %s", bridge);
        if (NULL == bridge) {
817
            lxcError(VIR_ERR_INTERNAL_ERROR,
818
                     "%s", _("Failed to get bridge for interface"));
819 820 821 822
            goto error_exit;
        }

        DEBUG0("calling vethCreate()");
823 824
        if (NULL != def->nets[i]->ifname) {
            strcpy(parentVeth, def->nets[i]->ifname);
825 826 827
        }
        DEBUG("parentVeth: %s, containerVeth: %s", parentVeth, containerVeth);
        if (0 != (rc = vethCreate(parentVeth, PATH_MAX, containerVeth, PATH_MAX))) {
828
            lxcError(VIR_ERR_INTERNAL_ERROR,
829
                     _("Failed to create veth device pair: %d"), rc);
830 831
            goto error_exit;
        }
832 833
        if (NULL == def->nets[i]->ifname) {
            def->nets[i]->ifname = strdup(parentVeth);
834
        }
835
        if (VIR_REALLOC_N(*veths, (*nveths)+1) < 0) {
836
            virReportOOMError();
837
            goto error_exit;
838 839
        }
        if (((*veths)[(*nveths)] = strdup(containerVeth)) == NULL) {
840
            virReportOOMError();
841
            goto error_exit;
842 843
        }
        (*nveths)++;
844

845
        if (NULL == def->nets[i]->ifname) {
846
            virReportOOMError();
847 848 849
            goto error_exit;
        }

850
        {
851 852 853
            char macaddr[VIR_MAC_STRING_BUFLEN];
            virFormatMacAddr(def->nets[i]->mac, macaddr);
            if (0 != (rc = setMacAddr(containerVeth, macaddr))) {
854
                virReportSystemError(rc,
855
                                     _("Failed to set %s to %s"),
856 857 858 859 860
                                     macaddr, containerVeth);
                goto error_exit;
            }
        }

861
        if (0 != (rc = brAddInterface(brctl, bridge, parentVeth))) {
862
            virReportSystemError(rc,
863
                                 _("Failed to add %s device to %s"),
864
                                 parentVeth, bridge);
865 866 867 868
            goto error_exit;
        }

        if (0 != (rc = vethInterfaceUpOrDown(parentVeth, 1))) {
869
            virReportSystemError(rc,
870 871
                                 _("Failed to enable %s device"),
                                 parentVeth);
872 873 874 875 876 877 878 879
            goto error_exit;
        }

    }

    rc = 0;

error_exit:
880
    brShutdown(brctl);
881 882 883
    return rc;
}

884

885
static int lxcMonitorClient(lxc_driver_t * driver,
886
                            virDomainObjPtr vm)
887
{
888 889 890
    char *sockpath = NULL;
    int fd;
    struct sockaddr_un addr;
891

892 893
    if (virAsprintf(&sockpath, "%s/%s.sock",
                    driver->stateDir, vm->def->name) < 0) {
894
        virReportOOMError();
895 896 897 898
        return -1;
    }

    if ((fd = socket(PF_UNIX, SOCK_STREAM, 0)) < 0) {
899
        virReportSystemError(errno, "%s",
900
                             _("Failed to create client socket"));
901
        goto error;
902 903
    }

904 905
    memset(&addr, 0, sizeof(addr));
    addr.sun_family = AF_UNIX;
C
Chris Lalancette 已提交
906
    if (virStrcpyStatic(addr.sun_path, sockpath) == NULL) {
907
        lxcError(VIR_ERR_INTERNAL_ERROR,
C
Chris Lalancette 已提交
908 909 910
                 _("Socket path %s too big for destination"), sockpath);
        goto error;
    }
911 912

    if (connect(fd, (struct sockaddr *) &addr, sizeof(addr)) < 0) {
913
        virReportSystemError(errno, "%s",
914
                             _("Failed to connect to client socket"));
915
        goto error;
916 917
    }

918 919
    VIR_FREE(sockpath);
    return fd;
920

921 922 923 924 925 926 927 928
error:
    VIR_FREE(sockpath);
    if (fd != -1)
        close(fd);
    return -1;
}


929
static int lxcVmTerminate(lxc_driver_t *driver,
930
                          virDomainObjPtr vm,
931 932 933 934
                          int signum)
{
    if (signum == 0)
        signum = SIGINT;
935

936
    if (vm->pid <= 0) {
937
        lxcError(VIR_ERR_INTERNAL_ERROR,
938
                 _("Invalid PID %d for container"), vm->pid);
939 940 941
        return -1;
    }

942 943
    if (kill(vm->pid, signum) < 0) {
        if (errno != ESRCH) {
944
            virReportSystemError(errno,
945
                                 _("Failed to kill pid %d"),
946
                                 vm->pid);
947
            return -1;
948
        }
949 950
    }

951
    vm->state = VIR_DOMAIN_SHUTDOWN;
952

953
    return lxcVmCleanup(driver, vm);
954
}
955

956 957
static void lxcMonitorEvent(int watch,
                            int fd,
958 959 960
                            int events ATTRIBUTE_UNUSED,
                            void *data)
{
961 962
    lxc_driver_t *driver = lxc_driver;
    virDomainObjPtr vm = data;
963
    virDomainEventPtr event = NULL;
964
    lxcDomainObjPrivatePtr priv;
965

966
    lxcDriverLock(driver);
967 968
    virDomainObjLock(vm);
    lxcDriverUnlock(driver);
969

970 971 972
    priv = vm->privateData;

    if (priv->monitor != fd || priv->monitorWatch != watch) {
973
        virEventRemoveHandle(watch);
974
        goto cleanup;
975 976
    }

977
    if (lxcVmTerminate(driver, vm, SIGINT) < 0) {
978
        virEventRemoveHandle(watch);
979 980 981 982 983
    } else {
        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_STOPPED,
                                         VIR_DOMAIN_EVENT_STOPPED_SHUTDOWN);
    }
984 985 986 987
    if (!vm->persistent) {
        virDomainRemoveInactive(&driver->domains, vm);
        vm = NULL;
    }
988 989

cleanup:
990 991
    if (vm)
        virDomainObjUnlock(vm);
992 993
    if (event) {
        lxcDriverLock(driver);
994
        lxcDomainEventQueue(driver, event);
995 996
        lxcDriverUnlock(driver);
    }
997 998 999
}


1000
static int lxcControllerStart(lxc_driver_t *driver,
1001 1002 1003 1004 1005 1006 1007 1008 1009 1010
                              virDomainObjPtr vm,
                              int nveths,
                              char **veths,
                              int appPty,
                              int logfd)
{
    int i;
    int rc;
    int largc = 0, larga = 0;
    const char **largv = NULL;
A
Amy Griffis 已提交
1011 1012 1013 1014 1015
    int lenvc = 0, lenva = 0;
    const char **lenv = NULL;
    char *filterstr;
    char *outputstr;
    char *tmp;
A
Amy Griffis 已提交
1016
    int log_level;
1017 1018
    pid_t child;
    int status;
1019 1020
    fd_set keepfd;
    char appPtyStr[30];
1021
    const char *emulator;
1022 1023

    FD_ZERO(&keepfd);
1024 1025 1026 1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046

#define ADD_ARG_SPACE                                                   \
    do { \
        if (largc == larga) {                                           \
            larga += 10;                                                \
            if (VIR_REALLOC_N(largv, larga) < 0)                        \
                goto no_memory;                                         \
        }                                                               \
    } while (0)

#define ADD_ARG(thisarg)                                                \
    do {                                                                \
        ADD_ARG_SPACE;                                                  \
        largv[largc++] = thisarg;                                       \
    } while (0)

#define ADD_ARG_LIT(thisarg)                                            \
    do {                                                                \
        ADD_ARG_SPACE;                                                  \
        if ((largv[largc++] = strdup(thisarg)) == NULL)                 \
            goto no_memory;                                             \
    } while (0)

A
Amy Griffis 已提交
1047 1048 1049 1050 1051 1052 1053 1054 1055 1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 1066 1067 1068 1069 1070
#define ADD_ENV_SPACE                                                   \
    do {                                                                \
        if (lenvc == lenva) {                                           \
            lenva += 10;                                                \
            if (VIR_REALLOC_N(lenv, lenva) < 0)                         \
                goto no_memory;                                         \
        }                                                               \
    } while (0)

#define ADD_ENV(thisarg)                                                \
    do {                                                                \
        ADD_ENV_SPACE;                                                  \
        lenv[lenvc++] = thisarg;                                        \
    } while (0)

#define ADD_ENV_PAIR(envname, val)                                      \
    do {                                                                \
        char *envval;                                                   \
        ADD_ENV_SPACE;                                                  \
        if (virAsprintf(&envval, "%s=%s", envname, val) < 0)            \
            goto no_memory;                                             \
        lenv[lenvc++] = envval;                                         \
    } while (0)

1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083
#define ADD_ENV_COPY(envname)                                           \
    do {                                                                \
        char *val = getenv(envname);                                    \
        if (val != NULL) {                                              \
            ADD_ENV_PAIR(envname, val);                                 \
        }                                                               \
    } while (0)

    /*
     * The controller may call ip command, so we have to remain PATH.
     */
    ADD_ENV_COPY("PATH");

A
Amy Griffis 已提交
1084 1085
    log_level = virLogGetDefaultPriority();
    if (virAsprintf(&tmp, "LIBVIRT_DEBUG=%d", log_level) < 0)
A
Amy Griffis 已提交
1086 1087 1088 1089 1090 1091 1092 1093 1094 1095 1096
        goto no_memory;
    ADD_ENV(tmp);

    if (virLogGetNbFilters() > 0) {
        filterstr = virLogGetFilters();
        if (!filterstr)
            goto no_memory;
        ADD_ENV_PAIR("LIBVIRT_LOG_FILTERS", filterstr);
        VIR_FREE(filterstr);
    }

A
Amy Griffis 已提交
1097 1098 1099 1100 1101 1102 1103 1104 1105 1106
    if (driver->log_libvirtd) {
        if (virLogGetNbOutputs() > 0) {
            outputstr = virLogGetOutputs();
            if (!outputstr)
                goto no_memory;
            ADD_ENV_PAIR("LIBVIRT_LOG_OUTPUTS", outputstr);
            VIR_FREE(outputstr);
        }
    } else {
        if (virAsprintf(&tmp, "LIBVIRT_LOG_OUTPUTS=%d:stderr", log_level) < 0)
A
Amy Griffis 已提交
1107
            goto no_memory;
A
Amy Griffis 已提交
1108
        ADD_ENV(tmp);
A
Amy Griffis 已提交
1109 1110 1111 1112
    }

    ADD_ENV(NULL);

1113 1114
    snprintf(appPtyStr, sizeof(appPtyStr), "%d", appPty);

1115 1116 1117
    emulator = vm->def->emulator;

    ADD_ARG_LIT(emulator);
1118 1119 1120
    ADD_ARG_LIT("--name");
    ADD_ARG_LIT(vm->def->name);
    ADD_ARG_LIT("--console");
1121
    ADD_ARG_LIT(appPtyStr);
1122 1123 1124 1125 1126 1127 1128 1129 1130
    ADD_ARG_LIT("--background");

    for (i = 0 ; i < nveths ; i++) {
        ADD_ARG_LIT("--veth");
        ADD_ARG_LIT(veths[i]);
    }

    ADD_ARG(NULL);

1131 1132
    FD_SET(appPty, &keepfd);

1133
    if (virExec(largv, lenv, &keepfd, &child,
1134
                -1, &logfd, &logfd,
1135 1136 1137 1138 1139 1140 1141 1142 1143
                VIR_EXEC_NONE) < 0)
        goto cleanup;

    /* We now wait for the process to exit - the controller
     * will fork() itself into the background - waiting for
     * it to exit thus guarentees it has written its pidfile
     */
    while ((rc = waitpid(child, &status, 0) == -1) && errno == EINTR);
    if (rc == -1) {
1144
        virReportSystemError(errno,
1145
                             _("Cannot wait for '%s'"),
1146
                             largv[0]);
1147 1148 1149 1150
        goto cleanup;
    }

    if (!(WIFEXITED(status) && WEXITSTATUS(status) == 0)) {
1151
        lxcError(VIR_ERR_INTERNAL_ERROR,
1152
                 _("Container '%s' unexpectedly shutdown during startup"),
1153 1154 1155 1156 1157 1158 1159
                 largv[0]);
        goto cleanup;
    }

#undef ADD_ARG
#undef ADD_ARG_LIT
#undef ADD_ARG_SPACE
A
Amy Griffis 已提交
1160 1161
#undef ADD_ENV_SPACE
#undef ADD_ENV_PAIR
1162

A
Amy Griffis 已提交
1163
    return 0;
1164 1165

no_memory:
1166
    virReportOOMError();
A
Amy Griffis 已提交
1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178
cleanup:
    if (largv) {
        for (i = 0 ; i < largc ; i++)
            VIR_FREE(largv[i]);
        VIR_FREE(largv);
    }
    if (lenv) {
        for (i=0 ; i < lenvc ; i++)
            VIR_FREE(lenv[i]);
        VIR_FREE(lenv);
    }
    return -1;
1179 1180 1181
}


1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192 1193
/**
 * lxcVmStart:
 * @conn: pointer to connection
 * @driver: pointer to driver structure
 * @vm: pointer to virtual machine structure
 *
 * Starts a vm
 *
 * Returns 0 on success or -1 in case of error
 */
static int lxcVmStart(virConnectPtr conn,
                      lxc_driver_t * driver,
1194
                      virDomainObjPtr  vm)
1195
{
1196
    int rc = -1, r;
1197 1198
    unsigned int i;
    int parentTty;
1199
    char *parentTtyPath = NULL;
1200 1201 1202 1203
    char *logfile = NULL;
    int logfd = -1;
    unsigned int nveths = 0;
    char **veths = NULL;
1204
    lxcDomainObjPrivatePtr priv = vm->privateData;
1205

L
Laine Stump 已提交
1206
    if ((r = virFileMakePath(driver->logDir)) != 0) {
1207
        virReportSystemError(r,
1208
                             _("Cannot create log directory '%s'"),
1209
                             driver->logDir);
1210 1211
        return -1;
    }
1212

1213 1214
    if (virAsprintf(&logfile, "%s/%s.log",
                    driver->logDir, vm->def->name) < 0) {
1215
        virReportOOMError();
1216
        return -1;
1217 1218
    }

1219
    /* open parent tty */
1220
    if (virFileOpenTty(&parentTty, &parentTtyPath, 1) < 0) {
1221
        virReportSystemError(errno, "%s",
1222
                             _("Failed to allocate tty"));
1223 1224
        goto cleanup;
    }
1225 1226 1227 1228 1229 1230 1231
    if (vm->def->console &&
        vm->def->console->type == VIR_DOMAIN_CHR_TYPE_PTY) {
        VIR_FREE(vm->def->console->data.file.path);
        vm->def->console->data.file.path = parentTtyPath;
    } else {
        VIR_FREE(parentTtyPath);
    }
1232

1233
    if (lxcSetupInterfaces(conn, vm->def, &nveths, &veths) != 0)
1234
        goto cleanup;
1235

1236
    /* Persist the live configuration now we have veth & tty info */
1237
    if (virDomainSaveConfig(driver->stateDir, vm->def) < 0)
1238 1239
        goto cleanup;

1240
    if ((logfd = open(logfile, O_WRONLY | O_APPEND | O_CREAT,
1241
             S_IRUSR|S_IWUSR)) < 0) {
1242
        virReportSystemError(errno,
1243
                             _("Failed to open '%s'"),
1244
                             logfile);
1245
        goto cleanup;
1246 1247
    }

1248
    if (lxcControllerStart(driver,
1249 1250 1251
                           vm,
                           nveths, veths,
                           parentTty, logfd) < 0)
1252
        goto cleanup;
1253 1254 1255 1256

    /* Connect to the controller as a client *first* because
     * this will block until the child has written their
     * pid file out to disk */
1257
    if ((priv->monitor = lxcMonitorClient(driver, vm)) < 0)
1258 1259
        goto cleanup;

1260
    /* And get its pid */
1261
    if ((r = virFileReadPid(driver->stateDir, vm->def->name, &vm->pid)) != 0) {
1262
        virReportSystemError(r,
1263 1264
                             _("Failed to read pid file %s/%s.pid"),
                             driver->stateDir, vm->def->name);
1265
        goto cleanup;
1266
    }
1267

1268
    vm->def->id = vm->pid;
1269 1270
    vm->state = VIR_DOMAIN_RUNNING;

1271 1272
    if ((priv->monitorWatch = virEventAddHandle(
             priv->monitor,
1273 1274
             VIR_EVENT_HANDLE_ERROR | VIR_EVENT_HANDLE_HANGUP,
             lxcMonitorEvent,
1275
             vm, NULL)) < 0) {
1276
        lxcVmTerminate(driver, vm, 0);
1277 1278
        goto cleanup;
    }
1279

1280 1281 1282 1283 1284 1285 1286 1287
    rc = 0;

cleanup:
    for (i = 0 ; i < nveths ; i++) {
        if (rc != 0)
            vethDelete(veths[i]);
        VIR_FREE(veths[i]);
    }
1288 1289 1290
    if (rc != 0 && priv->monitor != -1) {
        close(priv->monitor);
        priv->monitor = -1;
1291 1292 1293 1294 1295 1296
    }
    if (parentTty != -1)
        close(parentTty);
    if (logfd != -1)
        close(logfd);
    VIR_FREE(logfile);
1297 1298 1299 1300 1301 1302 1303 1304 1305 1306 1307 1308 1309
    return rc;
}

/**
 * lxcDomainStart:
 * @dom: domain to start
 *
 * Looks up domain and starts it.
 *
 * Returns 0 on success or -1 in case of error
 */
static int lxcDomainStart(virDomainPtr dom)
{
1310 1311
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
1312
    virDomainEventPtr event = NULL;
1313
    int ret = -1;
1314

1315
    lxcDriverLock(driver);
1316
    vm = virDomainFindByName(&driver->domains, dom->name);
1317
    if (!vm) {
1318
        lxcError(VIR_ERR_INVALID_DOMAIN,
1319
                 _("No domain named %s"), dom->name);
1320 1321 1322
        goto cleanup;
    }

1323
    if ((vm->def->nets != NULL) && !(driver->have_netns)) {
1324
        lxcError(VIR_ERR_NO_SUPPORT,
J
Jim Meyering 已提交
1325
                 "%s", _("System lacks NETNS support"));
1326 1327 1328
        goto cleanup;
    }

1329
    ret = lxcVmStart(dom->conn, driver, vm);
1330

1331 1332 1333 1334 1335
    if (ret == 0)
        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_STARTED,
                                         VIR_DOMAIN_EVENT_STARTED_BOOTED);

1336
cleanup:
1337 1338
    if (vm)
        virDomainObjUnlock(vm);
1339 1340
    if (event)
        lxcDomainEventQueue(driver, event);
1341
    lxcDriverUnlock(driver);
1342
    return ret;
1343 1344 1345 1346 1347 1348 1349 1350 1351 1352 1353 1354 1355 1356 1357 1358
}

/**
 * lxcDomainCreateAndStart:
 * @conn: pointer to connection
 * @xml: XML definition of domain
 * @flags: Unused
 *
 * Creates a domain based on xml and starts it
 *
 * Returns 0 on success or -1 in case of error
 */
static virDomainPtr
lxcDomainCreateAndStart(virConnectPtr conn,
                        const char *xml,
                        unsigned int flags ATTRIBUTE_UNUSED) {
1359
    lxc_driver_t *driver = conn->privateData;
1360
    virDomainObjPtr vm = NULL;
1361
    virDomainDefPtr def;
1362
    virDomainPtr dom = NULL;
1363
    virDomainEventPtr event = NULL;
1364

1365
    lxcDriverLock(driver);
1366
    if (!(def = virDomainDefParseString(driver->caps, xml,
1367
                                        VIR_DOMAIN_XML_INACTIVE)))
1368
        goto cleanup;
1369

1370 1371
    if (virDomainObjIsDuplicate(&driver->domains, def, 1) < 0)
        goto cleanup;
1372

1373
    if ((def->nets != NULL) && !(driver->have_netns)) {
1374
        lxcError(VIR_ERR_NO_SUPPORT,
J
Jim Meyering 已提交
1375
                 "%s", _("System lacks NETNS support"));
1376
        goto cleanup;
1377 1378
    }

1379

1380
    if (!(vm = virDomainAssignDef(driver->caps,
1381
                                  &driver->domains, def, false)))
1382 1383
        goto cleanup;
    def = NULL;
1384 1385

    if (lxcVmStart(conn, driver, vm) < 0) {
1386
        virDomainRemoveInactive(&driver->domains, vm);
1387
        vm = NULL;
1388
        goto cleanup;
1389 1390
    }

1391 1392 1393 1394
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STARTED,
                                     VIR_DOMAIN_EVENT_STARTED_BOOTED);

1395
    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
1396
    if (dom)
1397 1398
        dom->id = vm->def->id;

1399 1400
cleanup:
    virDomainDefFree(def);
1401 1402
    if (vm)
        virDomainObjUnlock(vm);
1403 1404
    if (event)
        lxcDomainEventQueue(driver, event);
1405
    lxcDriverUnlock(driver);
1406 1407 1408 1409 1410
    return dom;
}

/**
 * lxcDomainShutdown:
1411
 * @dom: pointer to domain to shutdown
1412 1413 1414 1415 1416 1417 1418
 *
 * Sends SIGINT to container root process to request it to shutdown
 *
 * Returns 0 on success or -1 in case of error
 */
static int lxcDomainShutdown(virDomainPtr dom)
{
1419 1420
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
1421
    virDomainEventPtr event = NULL;
1422
    int ret = -1;
1423

1424
    lxcDriverLock(driver);
1425
    vm = virDomainFindByID(&driver->domains, dom->id);
1426
    if (!vm) {
1427
        lxcError(VIR_ERR_INVALID_DOMAIN,
1428
                 _("No domain with id %d"), dom->id);
1429
        goto cleanup;
1430 1431
    }

1432
    ret = lxcVmTerminate(driver, vm, 0);
1433 1434 1435
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STOPPED,
                                     VIR_DOMAIN_EVENT_STOPPED_SHUTDOWN);
1436 1437 1438 1439
    if (!vm->persistent) {
        virDomainRemoveInactive(&driver->domains, vm);
        vm = NULL;
    }
1440 1441

cleanup:
1442 1443
    if (vm)
        virDomainObjUnlock(vm);
1444 1445 1446 1447 1448 1449 1450 1451
    if (event)
        lxcDomainEventQueue(driver, event);
    lxcDriverUnlock(driver);
    return ret;
}


static int
1452 1453 1454 1455
lxcDomainEventRegister(virConnectPtr conn,
                       virConnectDomainEventCallback callback,
                       void *opaque,
                       virFreeCallback freecb)
1456 1457 1458 1459 1460 1461 1462
{
    lxc_driver_t *driver = conn->privateData;
    int ret;

    lxcDriverLock(driver);
    ret = virDomainEventCallbackListAdd(conn, driver->domainEventCallbacks,
                                        callback, opaque, freecb);
1463
    lxcDriverUnlock(driver);
1464

1465
    return ret;
1466 1467
}

1468

1469
static int
1470 1471
lxcDomainEventDeregister(virConnectPtr conn,
                         virConnectDomainEventCallback callback)
1472 1473 1474 1475 1476 1477 1478 1479 1480 1481 1482 1483 1484 1485 1486 1487
{
    lxc_driver_t *driver = conn->privateData;
    int ret;

    lxcDriverLock(driver);
    if (driver->domainEventDispatching)
        ret = virDomainEventCallbackListMarkDelete(conn, driver->domainEventCallbacks,
                                                   callback);
    else
        ret = virDomainEventCallbackListRemove(conn, driver->domainEventCallbacks,
                                               callback);
    lxcDriverUnlock(driver);

    return ret;
}

1488 1489 1490 1491 1492 1493 1494 1495 1496 1497 1498 1499 1500 1501 1502 1503 1504 1505 1506 1507 1508 1509 1510 1511 1512 1513 1514 1515 1516 1517 1518 1519 1520 1521 1522 1523 1524 1525 1526 1527 1528 1529 1530

static int
lxcDomainEventRegisterAny(virConnectPtr conn,
                          virDomainPtr dom,
                          int eventID,
                          virConnectDomainEventGenericCallback callback,
                          void *opaque,
                          virFreeCallback freecb)
{
    lxc_driver_t *driver = conn->privateData;
    int ret;

    lxcDriverLock(driver);
    ret = virDomainEventCallbackListAddID(conn,
                                          driver->domainEventCallbacks,
                                          dom, eventID,
                                          callback, opaque, freecb);
    lxcDriverUnlock(driver);

    return ret;
}


static int
lxcDomainEventDeregisterAny(virConnectPtr conn,
                            int callbackID)
{
    lxc_driver_t *driver = conn->privateData;
    int ret;

    lxcDriverLock(driver);
    if (driver->domainEventDispatching)
        ret = virDomainEventCallbackListMarkDeleteID(conn, driver->domainEventCallbacks,
                                                     callbackID);
    else
        ret = virDomainEventCallbackListRemoveID(conn, driver->domainEventCallbacks,
                                                 callbackID);
    lxcDriverUnlock(driver);

    return ret;
}


1531 1532
static void lxcDomainEventDispatchFunc(virConnectPtr conn,
                                       virDomainEventPtr event,
1533
                                       virConnectDomainEventGenericCallback cb,
1534 1535 1536 1537 1538 1539 1540 1541 1542 1543 1544 1545 1546 1547 1548 1549 1550 1551 1552 1553 1554 1555 1556 1557 1558 1559 1560 1561 1562 1563 1564 1565 1566 1567 1568 1569 1570 1571 1572 1573 1574 1575 1576 1577 1578 1579 1580 1581 1582 1583 1584
                                       void *cbopaque,
                                       void *opaque)
{
    lxc_driver_t *driver = opaque;

    /* Drop the lock whle dispatching, for sake of re-entrancy */
    lxcDriverUnlock(driver);
    virDomainEventDispatchDefaultFunc(conn, event, cb, cbopaque, NULL);
    lxcDriverLock(driver);
}


static void lxcDomainEventFlush(int timer ATTRIBUTE_UNUSED, void *opaque)
{
    lxc_driver_t *driver = opaque;
    virDomainEventQueue tempQueue;

    lxcDriverLock(driver);

    driver->domainEventDispatching = 1;

    /* Copy the queue, so we're reentrant safe */
    tempQueue.count = driver->domainEventQueue->count;
    tempQueue.events = driver->domainEventQueue->events;
    driver->domainEventQueue->count = 0;
    driver->domainEventQueue->events = NULL;

    virEventUpdateTimeout(driver->domainEventTimer, -1);
    virDomainEventQueueDispatch(&tempQueue,
                                driver->domainEventCallbacks,
                                lxcDomainEventDispatchFunc,
                                driver);

    /* Purge any deleted callbacks */
    virDomainEventCallbackListPurgeMarked(driver->domainEventCallbacks);

    driver->domainEventDispatching = 0;
    lxcDriverUnlock(driver);
}


/* driver must be locked before calling */
static void lxcDomainEventQueue(lxc_driver_t *driver,
                                 virDomainEventPtr event)
{
    if (virDomainEventQueuePush(driver->domainEventQueue,
                                event) < 0)
        virDomainEventFree(event);
    if (lxc_driver->domainEventQueue->count == 1)
        virEventUpdateTimeout(driver->domainEventTimer, 0);
}
1585 1586 1587

/**
 * lxcDomainDestroy:
1588
 * @dom: pointer to domain to destroy
1589 1590 1591 1592 1593 1594 1595
 *
 * Sends SIGKILL to container root process to terminate the container
 *
 * Returns 0 on success or -1 in case of error
 */
static int lxcDomainDestroy(virDomainPtr dom)
{
1596 1597
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
1598
    virDomainEventPtr event = NULL;
1599
    int ret = -1;
1600

1601
    lxcDriverLock(driver);
1602
    vm = virDomainFindByID(&driver->domains, dom->id);
1603
    if (!vm) {
1604
        lxcError(VIR_ERR_INVALID_DOMAIN,
1605
                 _("No domain with id %d"), dom->id);
1606
        goto cleanup;
1607 1608
    }

1609
    ret = lxcVmTerminate(driver, vm, SIGKILL);
1610 1611 1612
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STOPPED,
                                     VIR_DOMAIN_EVENT_STOPPED_DESTROYED);
1613 1614 1615 1616
    if (!vm->persistent) {
        virDomainRemoveInactive(&driver->domains, vm);
        vm = NULL;
    }
1617 1618

cleanup:
1619 1620
    if (vm)
        virDomainObjUnlock(vm);
1621 1622
    if (event)
        lxcDomainEventQueue(driver, event);
1623
    lxcDriverUnlock(driver);
1624
    return ret;
1625
}
1626

1627 1628 1629 1630 1631
static int lxcCheckNetNsSupport(void)
{
    const char *argv[] = {"ip", "link", "set", "lo", "netns", "-1", NULL};
    int ip_rc;

1632
    if (virRun(argv, &ip_rc) < 0 ||
1633 1634
        !(WIFEXITED(ip_rc) && (WEXITSTATUS(ip_rc) != 255)))
        return 0;
1635

1636 1637
    if (lxcContainerAvailable(LXC_CONTAINER_FEATURE_NET) < 0)
        return 0;
1638

1639
    return 1;
1640 1641
}

1642

1643 1644 1645 1646 1647 1648 1649 1650 1651 1652 1653 1654 1655
struct lxcAutostartData {
    lxc_driver_t *driver;
    virConnectPtr conn;
};

static void
lxcAutostartDomain(void *payload, const char *name ATTRIBUTE_UNUSED, void *opaque)
{
    virDomainObjPtr vm = payload;
    const struct lxcAutostartData *data = opaque;

    virDomainObjLock(vm);
    if (vm->autostart &&
D
Daniel P. Berrange 已提交
1656
        !virDomainObjIsActive(vm)) {
1657 1658 1659
        int ret = lxcVmStart(data->conn, data->driver, vm);
        if (ret < 0) {
            virErrorPtr err = virGetLastError();
1660
            VIR_ERROR(_("Failed to autostart VM '%s': %s"),
1661 1662 1663 1664 1665 1666 1667 1668 1669 1670 1671 1672 1673 1674
                      vm->def->name,
                      err ? err->message : "");
        } else {
            virDomainEventPtr event =
                virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_STARTED,
                                         VIR_DOMAIN_EVENT_STARTED_BOOTED);
            if (event)
                lxcDomainEventQueue(data->driver, event);
        }
    }
    virDomainObjUnlock(vm);
}

1675 1676 1677 1678 1679 1680 1681 1682 1683 1684
static void
lxcAutostartConfigs(lxc_driver_t *driver) {
    /* XXX: Figure out a better way todo this. The domain
     * startup code needs a connection handle in order
     * to lookup the bridge associated with a virtual
     * network
     */
    virConnectPtr conn = virConnectOpen("lxc:///");
    /* Ignoring NULL conn which is mostly harmless here */

1685 1686
    struct lxcAutostartData data = { driver, conn };

1687
    lxcDriverLock(driver);
1688
    virHashForEach(driver->domains.objs, lxcAutostartDomain, &data);
1689 1690 1691 1692 1693 1694
    lxcDriverUnlock(driver);

    if (conn)
        virConnectClose(conn);
}

1695 1696 1697 1698 1699 1700 1701
static void
lxcReconnectVM(void *payload, const char *name ATTRIBUTE_UNUSED, void *opaque)
{
    virDomainObjPtr vm = payload;
    lxc_driver_t *driver = opaque;
    char *config = NULL;
    virDomainDefPtr tmp;
1702
    lxcDomainObjPrivatePtr priv;
1703 1704

    virDomainObjLock(vm);
1705 1706

    priv = vm->privateData;
1707
    if ((priv->monitor = lxcMonitorClient(driver, vm)) < 0) {
1708 1709 1710 1711 1712
        goto cleanup;
    }

    /* Read pid from controller */
    if ((virFileReadPid(lxc_driver->stateDir, vm->def->name, &vm->pid)) != 0) {
1713 1714
        close(priv->monitor);
        priv->monitor = -1;
1715 1716 1717
        goto cleanup;
    }

1718
    if ((config = virDomainConfigFile(driver->stateDir,
1719 1720 1721 1722
                                      vm->def->name)) == NULL)
        goto cleanup;

    /* Try and load the live config */
1723
    tmp = virDomainDefParseFile(driver->caps, config, 0);
1724 1725 1726 1727 1728 1729 1730 1731 1732
    VIR_FREE(config);
    if (tmp) {
        vm->newDef = vm->def;
        vm->def = tmp;
    }

    if (vm->pid != 0) {
        vm->def->id = vm->pid;
        vm->state = VIR_DOMAIN_RUNNING;
1733 1734 1735 1736 1737 1738

        if ((priv->monitorWatch = virEventAddHandle(
                 priv->monitor,
                 VIR_EVENT_HANDLE_ERROR | VIR_EVENT_HANDLE_HANGUP,
                 lxcMonitorEvent,
                 vm, NULL)) < 0) {
1739
            lxcVmTerminate(driver, vm, 0);
1740 1741
            goto cleanup;
        }
1742 1743
    } else {
        vm->def->id = -1;
1744 1745
        close(priv->monitor);
        priv->monitor = -1;
1746 1747 1748 1749 1750 1751
    }

cleanup:
    virDomainObjUnlock(vm);
}

1752

1753
static int lxcStartup(int privileged)
D
Daniel Veillard 已提交
1754
{
1755
    char *ld;
1756
    int rc;
1757 1758 1759 1760 1761 1762

    /* Valgrind gets very annoyed when we clone containers, so
     * disable LXC when under valgrind
     * XXX remove this when valgrind is fixed
     */
    ld = getenv("LD_PRELOAD");
1763 1764 1765 1766
    if (ld && strstr(ld, "vgpreload")) {
        VIR_INFO0("Running under valgrind, disabling driver");
        return 0;
    }
1767

1768
    /* Check that the user is root, silently disable if not */
1769
    if (!privileged) {
1770 1771 1772 1773 1774 1775 1776 1777
        VIR_INFO0("Not running privileged, disabling driver");
        return 0;
    }

    /* Check that this is a container enabled kernel */
    if (lxcContainerAvailable(0) < 0) {
        VIR_INFO0("LXC support not available in this kernel, disabling driver");
        return 0;
1778 1779
    }

1780
    if (VIR_ALLOC(lxc_driver) < 0) {
1781 1782
        return -1;
    }
1783 1784 1785 1786
    if (virMutexInit(&lxc_driver->lock) < 0) {
        VIR_FREE(lxc_driver);
        return -1;
    }
1787
    lxcDriverLock(lxc_driver);
D
Daniel Veillard 已提交
1788

1789 1790 1791
    if (virDomainObjListInit(&lxc_driver->domains) < 0)
        goto cleanup;

1792
    if (VIR_ALLOC(lxc_driver->domainEventCallbacks) < 0)
1793 1794 1795 1796 1797 1798 1799 1800
        goto cleanup;
    if (!(lxc_driver->domainEventQueue = virDomainEventQueueNew()))
        goto cleanup;

    if ((lxc_driver->domainEventTimer =
         virEventAddTimeout(-1, lxcDomainEventFlush, lxc_driver, NULL)) < 0)
        goto cleanup;

A
Amy Griffis 已提交
1801
    lxc_driver->log_libvirtd = 0; /* by default log to container logfile */
1802
    lxc_driver->have_netns = lxcCheckNetNsSupport();
D
Daniel Veillard 已提交
1803

1804 1805 1806 1807 1808 1809 1810
    rc = virCgroupForDriver("lxc", &lxc_driver->cgroup, privileged, 1);
    if (rc < 0) {
        char buf[1024];
        VIR_WARN("Unable to create cgroup for driver: %s",
                 virStrerror(-rc, buf, sizeof(buf)));
    }

D
Daniel Veillard 已提交
1811
    /* Call function to load lxc driver configuration information */
1812 1813
    if (lxcLoadDriverConfig(lxc_driver) < 0)
        goto cleanup;
D
Daniel Veillard 已提交
1814

1815 1816
    if ((lxc_driver->caps = lxcCapsInit()) == NULL)
        goto cleanup;
D
Daniel Veillard 已提交
1817

1818 1819 1820
    lxc_driver->caps->privateDataAllocFunc = lxcDomainObjPrivateAlloc;
    lxc_driver->caps->privateDataFreeFunc = lxcDomainObjPrivateFree;

1821
    if (virDomainLoadAllConfigs(lxc_driver->caps,
1822 1823
                                &lxc_driver->domains,
                                lxc_driver->configDir,
1824
                                lxc_driver->autostartDir,
1825
                                0, NULL, NULL) < 0)
1826
        goto cleanup;
1827

1828
    virHashForEach(lxc_driver->domains.objs, lxcReconnectVM, lxc_driver);
1829

1830
    lxcDriverUnlock(lxc_driver);
D
Daniel Veillard 已提交
1831 1832
    return 0;

1833 1834 1835 1836
cleanup:
    lxcDriverUnlock(lxc_driver);
    lxcShutdown();
    return -1;
D
Daniel Veillard 已提交
1837 1838
}

1839 1840 1841 1842 1843 1844 1845 1846 1847 1848 1849 1850 1851 1852 1853 1854 1855 1856 1857 1858 1859 1860 1861 1862 1863 1864
static void lxcNotifyLoadDomain(virDomainObjPtr vm, int newVM, void *opaque)
{
    lxc_driver_t *driver = opaque;

    if (newVM) {
        virDomainEventPtr event =
            virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_DEFINED,
                                     VIR_DOMAIN_EVENT_DEFINED_ADDED);
        if (event)
            lxcDomainEventQueue(driver, event);
    }
}

/**
 * lxcReload:
 *
 * Function to restart the LXC driver, it will recheck the configuration
 * files and perform autostart
 */
static int
lxcReload(void) {
    if (!lxc_driver)
        return 0;

    lxcDriverLock(lxc_driver);
1865
    virDomainLoadAllConfigs(lxc_driver->caps,
1866 1867 1868 1869 1870 1871 1872 1873 1874 1875 1876
                            &lxc_driver->domains,
                            lxc_driver->configDir,
                            lxc_driver->autostartDir,
                            0, lxcNotifyLoadDomain, lxc_driver);
    lxcDriverUnlock(lxc_driver);

    lxcAutostartConfigs(lxc_driver);

    return 0;
}

1877
static int lxcShutdown(void)
D
Daniel Veillard 已提交
1878
{
1879
    if (lxc_driver == NULL)
1880
        return(-1);
1881

1882
    lxcDriverLock(lxc_driver);
1883
    virDomainObjListDeinit(&lxc_driver->domains);
1884

1885 1886 1887 1888 1889 1890
    virDomainEventCallbackListFree(lxc_driver->domainEventCallbacks);
    virDomainEventQueueFree(lxc_driver->domainEventQueue);

    if (lxc_driver->domainEventTimer != -1)
        virEventRemoveTimeout(lxc_driver->domainEventTimer);

1891 1892 1893 1894 1895 1896
    virCapabilitiesFree(lxc_driver->caps);
    VIR_FREE(lxc_driver->configDir);
    VIR_FREE(lxc_driver->autostartDir);
    VIR_FREE(lxc_driver->stateDir);
    VIR_FREE(lxc_driver->logDir);
    lxcDriverUnlock(lxc_driver);
1897
    virMutexDestroy(&lxc_driver->lock);
1898
    VIR_FREE(lxc_driver);
1899 1900 1901

    return 0;
}
D
Daniel Veillard 已提交
1902

1903 1904 1905 1906 1907 1908 1909 1910 1911
/**
 * lxcActive:
 *
 * Checks if the LXC daemon is active, i.e. has an active domain
 *
 * Returns 1 if active, 0 otherwise
 */
static int
lxcActive(void) {
1912
    int active;
1913

1914 1915
    if (lxc_driver == NULL)
        return(0);
1916

1917
    lxcDriverLock(lxc_driver);
1918
    active = virDomainObjListNumOfDomains(&lxc_driver->domains, 1);
1919
    lxcDriverUnlock(lxc_driver);
1920

1921
    return active;
D
Daniel Veillard 已提交
1922 1923
}

1924
static int lxcVersion(virConnectPtr conn ATTRIBUTE_UNUSED, unsigned long *version)
D
Dan Smith 已提交
1925 1926 1927 1928 1929 1930
{
    struct utsname ver;
    int maj;
    int min;
    int rev;

1931
    uname(&ver);
D
Dan Smith 已提交
1932 1933

    if (sscanf(ver.release, "%i.%i.%i", &maj, &min, &rev) != 3) {
1934
        lxcError(VIR_ERR_INTERNAL_ERROR,
D
Dan Smith 已提交
1935 1936 1937 1938 1939 1940 1941 1942
                 _("Unknown release: %s"), ver.release);
        return -1;
    }

    *version = (maj * 1000 * 1000) + (min * 1000) + rev;

    return 0;
}
1943

1944 1945
static char *lxcGetSchedulerType(virDomainPtr domain ATTRIBUTE_UNUSED,
                                 int *nparams)
1946
{
1947 1948
    char *schedulerType = NULL;

1949 1950 1951
    if (nparams)
        *nparams = 1;

1952 1953 1954
    schedulerType = strdup("posix");

    if (schedulerType == NULL)
1955
        virReportOOMError();
1956 1957

    return schedulerType;
1958 1959
}

1960
static int lxcSetSchedulerParameters(virDomainPtr domain,
1961 1962 1963
                                     virSchedParameterPtr params,
                                     int nparams)
{
1964
    lxc_driver_t *driver = domain->conn->privateData;
1965
    int i;
1966 1967 1968
    virCgroupPtr group = NULL;
    virDomainObjPtr vm = NULL;
    int ret = -1;
1969

1970
    if (driver->cgroup == NULL)
1971 1972 1973 1974
        return -1;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);
1975

1976
    if (vm == NULL) {
1977
        lxcError(VIR_ERR_INTERNAL_ERROR,
1978 1979
                 _("No such domain %s"), domain->uuid);
        goto cleanup;
1980 1981
    }

1982
    if (virCgroupForDomain(driver->cgroup, vm->def->name, &group, 0) != 0)
1983
        goto cleanup;
1984 1985 1986

    for (i = 0; i < nparams; i++) {
        virSchedParameterPtr param = &params[i];
1987
        if (param->type != VIR_DOMAIN_SCHED_FIELD_ULLONG) {
1988
            lxcError(VIR_ERR_INVALID_ARG, "%s",
1989
                     _("Invalid type for cpu_shares tunable, expected a 'ullong'"));
1990 1991
            goto cleanup;
        }
1992 1993

        if (STREQ(param->field, "cpu_shares")) {
1994
            if (virCgroupSetCpuShares(group, params[i].value.ul) != 0)
1995
                goto cleanup;
1996
        } else {
1997
            lxcError(VIR_ERR_INVALID_ARG,
1998
                     _("Invalid parameter `%s'"), param->field);
1999
            goto cleanup;
2000 2001
        }
    }
2002
    ret = 0;
2003

2004
cleanup:
2005
    lxcDriverUnlock(driver);
2006
    virCgroupFree(&group);
2007 2008
    if (vm)
        virDomainObjUnlock(vm);
2009
    return ret;
2010 2011
}

2012
static int lxcGetSchedulerParameters(virDomainPtr domain,
2013 2014 2015
                                     virSchedParameterPtr params,
                                     int *nparams)
{
2016
    lxc_driver_t *driver = domain->conn->privateData;
2017 2018
    virCgroupPtr group = NULL;
    virDomainObjPtr vm = NULL;
2019
    unsigned long long val;
2020
    int ret = -1;
2021

2022
    if (driver->cgroup == NULL)
2023
        return -1;
2024 2025

    if ((*nparams) != 1) {
2026
        lxcError(VIR_ERR_INVALID_ARG,
J
Jim Meyering 已提交
2027
                 "%s", _("Invalid parameter count"));
2028
        return -1;
2029 2030
    }

2031 2032 2033
    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);

2034
    if (vm == NULL) {
2035
        lxcError(VIR_ERR_INTERNAL_ERROR,
2036 2037
                 _("No such domain %s"), domain->uuid);
        goto cleanup;
2038 2039
    }

2040
    if (virCgroupForDomain(driver->cgroup, vm->def->name, &group, 0) != 0)
2041
        goto cleanup;
2042

2043 2044
    if (virCgroupGetCpuShares(group, &val) != 0)
        goto cleanup;
2045
    params[0].value.ul = val;
C
Chris Lalancette 已提交
2046
    if (virStrcpyStatic(params[0].field, "cpu_shares") == NULL) {
2047
        lxcError(VIR_ERR_INTERNAL_ERROR,
C
Chris Lalancette 已提交
2048 2049 2050
                 "%s", _("Field cpu_shares too big for destination"));
        goto cleanup;
    }
2051 2052
    params[0].type = VIR_DOMAIN_SCHED_FIELD_ULLONG;

2053
    ret = 0;
2054

2055
cleanup:
2056
    lxcDriverUnlock(driver);
2057
    virCgroupFree(&group);
2058 2059
    if (vm)
        virDomainObjUnlock(vm);
2060
    return ret;
2061 2062
}

2063 2064 2065 2066 2067 2068 2069 2070 2071 2072 2073 2074 2075 2076 2077 2078 2079 2080
#ifdef __linux__
static int
lxcDomainInterfaceStats(virDomainPtr dom,
                        const char *path,
                        struct _virDomainInterfaceStats *stats)
{
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int i;
    int ret = -1;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    lxcDriverUnlock(driver);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
2081
        lxcError(VIR_ERR_NO_DOMAIN,
2082 2083 2084 2085 2086
                 _("No domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    if (!virDomainObjIsActive(vm)) {
2087
        lxcError(VIR_ERR_OPERATION_INVALID,
2088 2089 2090 2091 2092 2093 2094 2095 2096 2097 2098 2099 2100 2101
                 "%s", _("Domain is not running"));
        goto cleanup;
    }

    /* Check the path is one of the domain's network interfaces. */
    for (i = 0 ; i < vm->def->nnets ; i++) {
        if (vm->def->nets[i]->ifname &&
            STREQ(vm->def->nets[i]->ifname, path)) {
            ret = 0;
            break;
        }
    }

    if (ret == 0)
2102
        ret = linuxDomainInterfaceStats(path, stats);
2103
    else
2104
        lxcError(VIR_ERR_INVALID_ARG,
2105 2106 2107 2108 2109 2110 2111 2112 2113 2114 2115 2116
                 _("Invalid path, '%s' is not a known interface"), path);

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    return ret;
}
#else
static int
lxcDomainInterfaceStats(virDomainPtr dom,
                        const char *path ATTRIBUTE_UNUSED,
                        struct _virDomainInterfaceStats *stats ATTRIBUTE_UNUSED)
2117
    lxcError(VIR_ERR_NO_SUPPORT, "%s", __FUNCTION__);
2118 2119 2120 2121
    return -1;
}
#endif

2122 2123 2124 2125 2126 2127 2128 2129 2130 2131 2132 2133 2134
static int lxcDomainGetAutostart(virDomainPtr dom,
                                   int *autostart) {
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    lxcDriverUnlock(driver);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
2135
        lxcError(VIR_ERR_NO_DOMAIN,
2136
                 _("No domain with matching uuid '%s'"), uuidstr);
2137 2138 2139 2140 2141 2142 2143 2144 2145 2146 2147 2148 2149 2150 2151 2152 2153 2154 2155 2156 2157 2158 2159 2160 2161
        goto cleanup;
    }

    *autostart = vm->autostart;
    ret = 0;

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    return ret;
}

static int lxcDomainSetAutostart(virDomainPtr dom,
                                   int autostart) {
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    char *configFile = NULL, *autostartLink = NULL;
    int ret = -1;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
2162
        lxcError(VIR_ERR_NO_DOMAIN,
2163
                 _("No domain with matching uuid '%s'"), uuidstr);
2164 2165 2166 2167
        goto cleanup;
    }

    if (!vm->persistent) {
2168
        lxcError(VIR_ERR_INTERNAL_ERROR,
2169
                 "%s", _("Cannot set autostart for transient domain"));
2170 2171 2172 2173 2174
        goto cleanup;
    }

    autostart = (autostart != 0);

2175 2176 2177 2178
    if (vm->autostart == autostart) {
        ret = 0;
        goto cleanup;
    }
2179

2180
    configFile = virDomainConfigFile(driver->configDir,
2181 2182 2183
                                     vm->def->name);
    if (configFile == NULL)
        goto cleanup;
2184
    autostartLink = virDomainConfigFile(driver->autostartDir,
2185 2186 2187
                                        vm->def->name);
    if (autostartLink == NULL)
        goto cleanup;
2188

2189 2190
    if (autostart) {
        int err;
2191

2192
        if ((err = virFileMakePath(driver->autostartDir))) {
2193
            virReportSystemError(err,
2194 2195 2196
                                 _("Cannot create autostart directory %s"),
                                 driver->autostartDir);
            goto cleanup;
2197 2198
        }

2199
        if (symlink(configFile, autostartLink) < 0) {
2200
            virReportSystemError(errno,
2201 2202 2203 2204 2205 2206
                                 _("Failed to create symlink '%s to '%s'"),
                                 autostartLink, configFile);
            goto cleanup;
        }
    } else {
        if (unlink(autostartLink) < 0 && errno != ENOENT && errno != ENOTDIR) {
2207
            virReportSystemError(errno,
2208 2209 2210 2211
                                 _("Failed to delete symlink '%s'"),
                                 autostartLink);
            goto cleanup;
        }
2212
    }
2213 2214

    vm->autostart = autostart;
2215 2216 2217 2218 2219 2220 2221 2222 2223 2224 2225
    ret = 0;

cleanup:
    VIR_FREE(configFile);
    VIR_FREE(autostartLink);
    if (vm)
        virDomainObjUnlock(vm);
    lxcDriverUnlock(driver);
    return ret;
}

R
Ryota Ozaki 已提交
2226 2227 2228 2229 2230 2231 2232 2233 2234 2235 2236 2237 2238 2239 2240 2241 2242 2243 2244 2245 2246 2247 2248 2249 2250 2251 2252 2253 2254 2255 2256 2257 2258 2259 2260 2261 2262 2263 2264 2265 2266 2267 2268 2269 2270 2271 2272 2273 2274 2275 2276 2277 2278 2279 2280 2281 2282 2283 2284 2285 2286 2287 2288 2289 2290 2291 2292 2293 2294 2295 2296 2297 2298 2299 2300 2301 2302 2303 2304 2305 2306 2307 2308 2309 2310 2311 2312 2313 2314 2315 2316 2317 2318 2319 2320 2321 2322 2323 2324 2325 2326 2327 2328 2329 2330
static int lxcFreezeContainer(lxc_driver_t *driver, virDomainObjPtr vm)
{
    int timeout = 1000; /* In milliseconds */
    int check_interval = 1; /* In milliseconds */
    int exp = 10;
    int waited_time = 0;
    int ret = -1;
    char *state = NULL;
    virCgroupPtr cgroup = NULL;

    if (!(driver->cgroup &&
        virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) == 0))
        return -1;

    while (waited_time < timeout) {
        int r;
        /*
         * Writing "FROZEN" to the "freezer.state" freezes the group,
         * i.e., the container, temporarily transiting "FREEZING" state.
         * Once the freezing is completed, the state of the group transits
         * to "FROZEN".
         * (see linux-2.6/Documentation/cgroups/freezer-subsystem.txt)
         */
        r = virCgroupSetFreezerState(cgroup, "FROZEN");

        /*
         * Returning EBUSY explicitly indicates that the group is
         * being freezed but incomplete and other errors are true
         * errors.
         */
        if (r < 0 && r != -EBUSY) {
            VIR_DEBUG("Writing freezer.state failed with errno: %d", r);
            goto error;
        }
        if (r == -EBUSY)
            VIR_DEBUG0("Writing freezer.state gets EBUSY");

        /*
         * Unfortunately, returning 0 (success) is likely to happen
         * even when the freezing has not been completed. Sometimes
         * the state of the group remains "FREEZING" like when
         * returning -EBUSY and even worse may never transit to
         * "FROZEN" even if writing "FROZEN" again.
         *
         * So we don't trust the return value anyway and always
         * decide that the freezing has been complete only with
         * the state actually transit to "FROZEN".
         */
        usleep(check_interval * 1000);

        r = virCgroupGetFreezerState(cgroup, &state);

        if (r < 0) {
            VIR_DEBUG("Reading freezer.state failed with errno: %d", r);
            goto error;
        }
        VIR_DEBUG("Read freezer.state: %s", state);

        if (STREQ(state, "FROZEN")) {
            ret = 0;
            goto cleanup;
        }

        waited_time += check_interval;
        /*
         * Increasing check_interval exponentially starting with
         * small initial value treats nicely two cases; One is
         * a container is under no load and waiting for long period
         * makes no sense. The other is under heavy load. The container
         * may stay longer time in FREEZING or never transit to FROZEN.
         * In that case, eager polling will just waste CPU time.
         */
        check_interval *= exp;
        VIR_FREE(state);
    }
    VIR_DEBUG0("lxcFreezeContainer timeout");
error:
    /*
     * If timeout or an error on reading the state occurs,
     * activate the group again and return an error.
     * This is likely to fall the group back again gracefully.
     */
    virCgroupSetFreezerState(cgroup, "THAWED");
    ret = -1;

cleanup:
    if (cgroup)
        virCgroupFree(&cgroup);
    VIR_FREE(state);
    return ret;
}

static int lxcDomainSuspend(virDomainPtr dom)
{
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    virDomainEventPtr event = NULL;
    int ret = -1;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
2331
        lxcError(VIR_ERR_NO_DOMAIN,
2332
                 _("No domain with matching uuid '%s'"), uuidstr);
R
Ryota Ozaki 已提交
2333 2334 2335
        goto cleanup;
    }

D
Daniel P. Berrange 已提交
2336
    if (!virDomainObjIsActive(vm)) {
2337
        lxcError(VIR_ERR_OPERATION_INVALID,
2338
                 "%s", _("Domain is not running"));
R
Ryota Ozaki 已提交
2339 2340 2341 2342 2343
        goto cleanup;
    }

    if (vm->state != VIR_DOMAIN_PAUSED) {
        if (lxcFreezeContainer(driver, vm) < 0) {
2344
            lxcError(VIR_ERR_OPERATION_FAILED,
2345
                     "%s", _("Suspend operation failed"));
R
Ryota Ozaki 已提交
2346 2347 2348 2349 2350 2351 2352 2353 2354
            goto cleanup;
        }
        vm->state = VIR_DOMAIN_PAUSED;

        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_SUSPENDED,
                                         VIR_DOMAIN_EVENT_SUSPENDED_PAUSED);
    }

2355
    if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
R
Ryota Ozaki 已提交
2356 2357 2358 2359 2360 2361 2362 2363 2364 2365 2366 2367 2368 2369 2370 2371 2372 2373 2374 2375 2376 2377 2378 2379 2380 2381 2382 2383 2384 2385 2386 2387 2388 2389 2390 2391 2392 2393 2394 2395
        goto cleanup;
    ret = 0;

cleanup:
    if (event)
        lxcDomainEventQueue(driver, event);
    if (vm)
        virDomainObjUnlock(vm);
    lxcDriverUnlock(driver);
    return ret;
}

static int lxcUnfreezeContainer(lxc_driver_t *driver, virDomainObjPtr vm)
{
    int ret;
    virCgroupPtr cgroup = NULL;

    if (!(driver->cgroup &&
        virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) == 0))
        return -1;

    ret = virCgroupSetFreezerState(cgroup, "THAWED");

    virCgroupFree(&cgroup);
    return ret;
}

static int lxcDomainResume(virDomainPtr dom)
{
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    virDomainEventPtr event = NULL;
    int ret = -1;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
2396
        lxcError(VIR_ERR_NO_DOMAIN,
2397
                 _("No domain with matching uuid '%s'"), uuidstr);
R
Ryota Ozaki 已提交
2398 2399 2400
        goto cleanup;
    }

D
Daniel P. Berrange 已提交
2401
    if (!virDomainObjIsActive(vm)) {
2402
        lxcError(VIR_ERR_OPERATION_INVALID,
2403
                 "%s", _("Domain is not running"));
R
Ryota Ozaki 已提交
2404 2405 2406 2407 2408
        goto cleanup;
    }

    if (vm->state == VIR_DOMAIN_PAUSED) {
        if (lxcUnfreezeContainer(driver, vm) < 0) {
2409
            lxcError(VIR_ERR_OPERATION_FAILED,
2410
                     "%s", _("Resume operation failed"));
R
Ryota Ozaki 已提交
2411 2412 2413 2414 2415 2416 2417 2418 2419
            goto cleanup;
        }
        vm->state = VIR_DOMAIN_RUNNING;

        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_RESUMED,
                                         VIR_DOMAIN_EVENT_RESUMED_UNPAUSED);
    }

2420
    if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
R
Ryota Ozaki 已提交
2421 2422 2423 2424 2425 2426 2427 2428 2429 2430 2431 2432 2433
        goto cleanup;
    ret = 0;

cleanup:
    if (event)
        lxcDomainEventQueue(driver, event);
    if (vm)
        virDomainObjUnlock(vm);
    lxcDriverUnlock(driver);
    return ret;
}


D
Daniel Veillard 已提交
2434 2435 2436 2437 2438 2439 2440 2441
/* Function Tables */
static virDriver lxcDriver = {
    VIR_DRV_LXC, /* the number virDrvNo */
    "LXC", /* the name of the driver */
    lxcOpen, /* open */
    lxcClose, /* close */
    NULL, /* supports_feature */
    NULL, /* type */
D
Dan Smith 已提交
2442
    lxcVersion, /* version */
2443
    NULL, /* libvirtVersion (impl. in libvirt.c) */
2444
    virGetHostname, /* getHostname */
D
Daniel Veillard 已提交
2445
    NULL, /* getMaxVcpus */
2446 2447
    nodeGetInfo, /* nodeGetInfo */
    lxcGetCapabilities, /* getCapabilities */
D
Daniel Veillard 已提交
2448 2449
    lxcListDomains, /* listDomains */
    lxcNumDomains, /* numOfDomains */
2450
    lxcDomainCreateAndStart, /* domainCreateXML */
D
Daniel Veillard 已提交
2451 2452 2453
    lxcDomainLookupByID, /* domainLookupByID */
    lxcDomainLookupByUUID, /* domainLookupByUUID */
    lxcDomainLookupByName, /* domainLookupByName */
R
Ryota Ozaki 已提交
2454 2455
    lxcDomainSuspend, /* domainSuspend */
    lxcDomainResume, /* domainResume */
2456
    lxcDomainShutdown, /* domainShutdown */
D
Daniel Veillard 已提交
2457
    NULL, /* domainReboot */
2458
    lxcDomainDestroy, /* domainDestroy */
D
Daniel Veillard 已提交
2459
    lxcGetOSType, /* domainGetOSType */
R
Ryota Ozaki 已提交
2460 2461 2462
    lxcDomainGetMaxMemory, /* domainGetMaxMemory */
    lxcDomainSetMaxMemory, /* domainSetMaxMemory */
    lxcDomainSetMemory, /* domainSetMemory */
D
Daniel Veillard 已提交
2463 2464 2465 2466 2467 2468 2469 2470
    lxcDomainGetInfo, /* domainGetInfo */
    NULL, /* domainSave */
    NULL, /* domainRestore */
    NULL, /* domainCoreDump */
    NULL, /* domainSetVcpus */
    NULL, /* domainPinVcpu */
    NULL, /* domainGetVcpus */
    NULL, /* domainGetMaxVcpus */
2471 2472
    NULL, /* domainGetSecurityLabel */
    NULL, /* nodeGetSecurityModel */
D
Daniel Veillard 已提交
2473
    lxcDomainDumpXML, /* domainDumpXML */
2474 2475
    NULL, /* domainXMLFromNative */
    NULL, /* domainXMLToNative */
D
Daniel Veillard 已提交
2476 2477
    lxcListDefinedDomains, /* listDefinedDomains */
    lxcNumDefinedDomains, /* numOfDefinedDomains */
2478
    lxcDomainStart, /* domainCreate */
D
Daniel Veillard 已提交
2479 2480 2481
    lxcDomainDefine, /* domainDefineXML */
    lxcDomainUndefine, /* domainUndefine */
    NULL, /* domainAttachDevice */
2482
    NULL, /* domainAttachDeviceFlags */
D
Daniel Veillard 已提交
2483
    NULL, /* domainDetachDevice */
2484
    NULL, /* domainDetachDeviceFlags */
2485
    NULL, /* domainUpdateDeviceFlags */
2486 2487
    lxcDomainGetAutostart, /* domainGetAutostart */
    lxcDomainSetAutostart, /* domainSetAutostart */
2488 2489 2490
    lxcGetSchedulerType, /* domainGetSchedulerType */
    lxcGetSchedulerParameters, /* domainGetSchedulerParameters */
    lxcSetSchedulerParameters, /* domainSetSchedulerParameters */
D
Daniel Veillard 已提交
2491 2492 2493 2494
    NULL, /* domainMigratePrepare */
    NULL, /* domainMigratePerform */
    NULL, /* domainMigrateFinish */
    NULL, /* domainBlockStats */
2495
    lxcDomainInterfaceStats, /* domainInterfaceStats */
2496
    NULL, /* domainMemoryStats */
D
Daniel P. Berrange 已提交
2497 2498
    NULL, /* domainBlockPeek */
    NULL, /* domainMemoryPeek */
2499 2500
    nodeGetCellsFreeMemory, /* nodeGetCellsFreeMemory */
    nodeGetFreeMemory,  /* getFreeMemory */
2501 2502
    lxcDomainEventRegister, /* domainEventRegister */
    lxcDomainEventDeregister, /* domainEventDeregister */
D
Daniel Veillard 已提交
2503 2504
    NULL, /* domainMigratePrepare2 */
    NULL, /* domainMigrateFinish2 */
2505
    NULL, /* nodeDeviceDettach */
2506 2507
    NULL, /* nodeDeviceReAttach */
    NULL, /* nodeDeviceReset */
C
Chris Lalancette 已提交
2508
    NULL, /* domainMigratePrepareTunnel */
2509 2510 2511 2512
    lxcIsEncrypted,
    lxcIsSecure,
    lxcDomainIsActive,
    lxcDomainIsPersistent,
J
Jiri Denemark 已提交
2513
    NULL, /* cpuCompare */
2514
    NULL, /* cpuBaseline */
2515
    NULL, /* domainGetJobInfo */
2516
    NULL, /* domainAbortJob */
2517
    NULL, /* domainMigrateSetMaxDowntime */
2518 2519
    lxcDomainEventRegisterAny, /* domainEventRegisterAny */
    lxcDomainEventDeregisterAny, /* domainEventDeregisterAny */
D
Daniel Veillard 已提交
2520 2521
};

2522
static virStateDriver lxcStateDriver = {
2523
    .name = "LXC",
2524 2525 2526
    .initialize = lxcStartup,
    .cleanup = lxcShutdown,
    .active = lxcActive,
2527
    .reload = lxcReload,
2528 2529
};

D
Daniel Veillard 已提交
2530 2531 2532
int lxcRegister(void)
{
    virRegisterDriver(&lxcDriver);
2533
    virRegisterStateDriver(&lxcStateDriver);
D
Daniel Veillard 已提交
2534 2535
    return 0;
}