/*
 * Copyright IBM Corp. 2008
 *
 * lxc_driver.c: linux container driver functions
 *
 * Authors:
 *  David L. Leskovec <dlesko at linux.vnet.ibm.com>
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
 */

#include <config.h>

26
#include <fcntl.h>
D
Daniel Veillard 已提交
27 28
#include <sched.h>
#include <sys/utsname.h>
D
David L. Leskovec 已提交
29
#include <stdbool.h>
D
Daniel Veillard 已提交
30 31
#include <string.h>
#include <sys/types.h>
32 33 34
#include <sys/socket.h>
#include <sys/un.h>
#include <sys/poll.h>
D
Daniel Veillard 已提交
35 36 37
#include <unistd.h>
#include <wait.h>

38
#include "virterror_internal.h"
39
#include "logging.h"
40
#include "datatypes.h"
D
Daniel Veillard 已提交
41
#include "lxc_conf.h"
42
#include "lxc_container.h"
D
Daniel Veillard 已提交
43
#include "lxc_driver.h"
44
#include "memory.h"
45
#include "util.h"
46 47
#include "bridge.h"
#include "veth.h"
48
#include "event.h"
49
#include "nodeinfo.h"
50
#include "uuid.h"
51
#include "stats_linux.h"
52

D
Daniel Veillard 已提交
53

54 55
#define VIR_FROM_THIS VIR_FROM_LXC

56 57 58 59 60 61 62 63
/* Per-domain private data attached to a domain object by this driver. */
typedef struct _lxcDomainObjPrivate lxcDomainObjPrivate;
typedef lxcDomainObjPrivate *lxcDomainObjPrivatePtr;
struct _lxcDomainObjPrivate {
    int monitor;      /* monitor file descriptor; -1 when not set */
    int monitorWatch; /* event-loop watch handle for the monitor; -1 when not set */
};


64
static int lxcStartup(int privileged);
65
static int lxcShutdown(void);
66
static lxc_driver_t *lxc_driver = NULL;
D
Daniel Veillard 已提交
67 68 69

/* Functions */

70 71
/* Take the mutex embedded in the driver structure. */
static void lxcDriverLock(lxc_driver_t *driver)
{
    virMutexLock(&(driver->lock));
}
/* Release the mutex embedded in the driver structure. */
static void lxcDriverUnlock(lxc_driver_t *driver)
{
    virMutexUnlock(&(driver->lock));
}

79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99
/*
 * Allocate the per-domain private data with both the monitor fd and
 * the monitor watch marked as unset (-1).
 *
 * Returns the new object, or NULL if the allocation failed.
 */
static void *lxcDomainObjPrivateAlloc(void)
{
    lxcDomainObjPrivatePtr data;

    if (VIR_ALLOC(data) < 0)
        return NULL;

    data->monitorWatch = -1;
    data->monitor = -1;

    return data;
}

/* Release per-domain private data obtained from lxcDomainObjPrivateAlloc(). */
static void lxcDomainObjPrivateFree(void *data)
{
    lxcDomainObjPrivatePtr state = data;

    VIR_FREE(state);
}


100 101 102 103
static void lxcDomainEventFlush(int timer, void *opaque);
static void lxcDomainEventQueue(lxc_driver_t *driver,
                                virDomainEventPtr event);

104

D
Daniel Veillard 已提交
105 106 107 108 109
/**
 * lxcOpen:
 * @conn: connection being opened
 * @auth: unused
 * @flags: unused
 *
 * Decide whether this driver handles @conn.  With no URI the driver
 * claims the connection only if the state driver is active, and fills
 * in "lxc:///" as the URI.  With a URI, the scheme must be "lxc" and
 * no server may be given (those are left to the remote driver).
 *
 * Returns VIR_DRV_OPEN_SUCCESS after storing the driver in
 * conn->privateData, VIR_DRV_OPEN_DECLINED if the connection is not
 * for this driver, or VIR_DRV_OPEN_ERROR on failure.
 */
static virDrvOpenStatus lxcOpen(virConnectPtr conn,
                                virConnectAuthPtr auth ATTRIBUTE_UNUSED,
                                int flags ATTRIBUTE_UNUSED)
{
    /* Verify uri was specified */
    if (conn->uri == NULL) {
        if (lxc_driver == NULL)
            return VIR_DRV_OPEN_DECLINED;

        conn->uri = xmlParseURI("lxc:///");
        if (!conn->uri) {
            virReportOOMError();
            return VIR_DRV_OPEN_ERROR;
        }
    } else {
        if (conn->uri->scheme == NULL ||
            STRNEQ(conn->uri->scheme, "lxc"))
            return VIR_DRV_OPEN_DECLINED;

        /* Leave for remote driver */
        if (conn->uri->server != NULL)
            return VIR_DRV_OPEN_DECLINED;

        /* If path isn't '/' then they typoed, tell them correct path.
         * A parsed URI may carry no path at all (e.g. "lxc:"), so the
         * pointer must be checked before it is compared or printed. */
        if (conn->uri->path != NULL &&
            STRNEQ(conn->uri->path, "/")) {
            lxcError(VIR_ERR_INTERNAL_ERROR,
                     _("Unexpected LXC URI path '%s', try lxc:///"),
                     conn->uri->path);
            return VIR_DRV_OPEN_ERROR;
        }

        /* URI was good, but driver isn't active */
        if (lxc_driver == NULL) {
            lxcError(VIR_ERR_INTERNAL_ERROR,
                     "%s", _("lxc state driver is not active"));
            return VIR_DRV_OPEN_ERROR;
        }
    }

    conn->privateData = lxc_driver;

    return VIR_DRV_OPEN_SUCCESS;
}

/*
 * Drop every domain event callback registered through @conn and
 * detach the driver from the connection.  Always returns 0.
 */
static int lxcClose(virConnectPtr conn)
{
    lxc_driver_t *drv = conn->privateData;

    lxcDriverLock(drv);
    virDomainEventCallbackListRemoveConn(conn, drv->domainEventCallbacks);
    lxcDriverUnlock(drv);

    conn->privateData = NULL;

    return 0;
}

161 162 163 164 165 166 167 168 169 170 171 172 173 174 175

/* Always reports the connection as secure (returns 1). */
static int lxcIsSecure(virConnectPtr conn ATTRIBUTE_UNUSED)
{
    /* The driver only ever runs inside the daemon, so this is trivially true */
    return 1;
}


/* Always reports the connection as not encrypted (returns 0). */
static int lxcIsEncrypted(virConnectPtr conn ATTRIBUTE_UNUSED)
{
    /* No encryption here; the remote driver is responsible for that */
    return 0;
}


176 177 178 179 180 181
/*
 * Format the driver capabilities as XML while holding the driver lock.
 *
 * Returns the XML string, or NULL (after reporting OOM) if formatting
 * failed.
 */
static char *lxcGetCapabilities(virConnectPtr conn) {
    lxc_driver_t *drv = conn->privateData;
    char *capsXML;

    lxcDriverLock(drv);
    capsXML = virCapabilitiesFormatXML(drv->caps);
    if (capsXML == NULL)
        virReportOOMError();
    lxcDriverUnlock(drv);

    return capsXML;
}


D
Daniel Veillard 已提交
189 190 191
/*
 * Find a domain by numeric id.
 *
 * Returns a domain handle carrying the id from the domain definition,
 * or NULL if no such domain exists (VIR_ERR_NO_DOMAIN is reported) or
 * the handle could not be created.
 */
static virDomainPtr lxcDomainLookupByID(virConnectPtr conn,
                                        int id)
{
    lxc_driver_t *drv = conn->privateData;
    virDomainObjPtr obj;
    virDomainPtr handle;

    lxcDriverLock(drv);
    obj = virDomainFindByID(&drv->domains, id);
    lxcDriverUnlock(drv);

    if (obj == NULL) {
        lxcError(VIR_ERR_NO_DOMAIN, NULL);
        return NULL;
    }

    handle = virGetDomain(conn, obj->def->name, obj->def->uuid);
    if (handle != NULL)
        handle->id = obj->def->id;

    /* the object found above is released here */
    virDomainObjUnlock(obj);
    return handle;
}

/*
 * Find a domain by UUID.
 *
 * Returns a domain handle carrying the id from the domain definition,
 * or NULL if no such domain exists (VIR_ERR_NO_DOMAIN is reported) or
 * the handle could not be created.
 */
static virDomainPtr lxcDomainLookupByUUID(virConnectPtr conn,
                                          const unsigned char *uuid)
{
    lxc_driver_t *drv = conn->privateData;
    virDomainObjPtr obj;
    virDomainPtr handle;

    lxcDriverLock(drv);
    obj = virDomainFindByUUID(&drv->domains, uuid);
    lxcDriverUnlock(drv);

    if (obj == NULL) {
        lxcError(VIR_ERR_NO_DOMAIN, NULL);
        return NULL;
    }

    handle = virGetDomain(conn, obj->def->name, obj->def->uuid);
    if (handle != NULL)
        handle->id = obj->def->id;

    /* the object found above is released here */
    virDomainObjUnlock(obj);
    return handle;
}

/*
 * Find a domain by name.
 *
 * Returns a domain handle carrying the id from the domain definition,
 * or NULL if no such domain exists (VIR_ERR_NO_DOMAIN is reported) or
 * the handle could not be created.
 */
static virDomainPtr lxcDomainLookupByName(virConnectPtr conn,
                                          const char *name)
{
    lxc_driver_t *drv = conn->privateData;
    virDomainObjPtr obj;
    virDomainPtr handle;

    lxcDriverLock(drv);
    obj = virDomainFindByName(&drv->domains, name);
    lxcDriverUnlock(drv);

    if (obj == NULL) {
        lxcError(VIR_ERR_NO_DOMAIN, NULL);
        return NULL;
    }

    handle = virGetDomain(conn, obj->def->name, obj->def->uuid);
    if (handle != NULL)
        handle->id = obj->def->id;

    /* the object found above is released here */
    virDomainObjUnlock(obj);
    return handle;
}

266 267 268 269 270 271 272 273 274 275 276

/*
 * Report whether the domain identified by dom->uuid is active.
 *
 * Returns the result of virDomainObjIsActive(), or -1 if the domain
 * is unknown (VIR_ERR_NO_DOMAIN is reported).
 */
static int lxcDomainIsActive(virDomainPtr dom)
{
    lxc_driver_t *drv = dom->conn->privateData;
    virDomainObjPtr vm;
    int active;

    lxcDriverLock(drv);
    vm = virDomainFindByUUID(&drv->domains, dom->uuid);
    lxcDriverUnlock(drv);

    if (vm == NULL) {
        lxcError(VIR_ERR_NO_DOMAIN, NULL);
        return -1;
    }

    active = virDomainObjIsActive(vm);
    virDomainObjUnlock(vm);

    return active;
}


/*
 * Report whether the domain identified by dom->uuid is persistent.
 *
 * Returns the domain object's persistent flag, or -1 if the domain is
 * unknown (VIR_ERR_NO_DOMAIN is reported).
 */
static int lxcDomainIsPersistent(virDomainPtr dom)
{
    lxc_driver_t *drv = dom->conn->privateData;
    virDomainObjPtr vm;
    int persistent;

    lxcDriverLock(drv);
    vm = virDomainFindByUUID(&drv->domains, dom->uuid);
    lxcDriverUnlock(drv);

    if (vm == NULL) {
        lxcError(VIR_ERR_NO_DOMAIN, NULL);
        return -1;
    }

    persistent = vm->persistent;
    virDomainObjUnlock(vm);

    return persistent;
}


311
/*
 * Collect the ids of active domains into @ids (capacity @nids) under
 * the driver lock; returns whatever virDomainObjListGetActiveIDs()
 * returns.
 */
static int lxcListDomains(virConnectPtr conn, int *ids, int nids) {
    lxc_driver_t *drv = conn->privateData;
    int count;

    lxcDriverLock(drv);
    count = virDomainObjListGetActiveIDs(&drv->domains, ids, nids);
    lxcDriverUnlock(drv);

    return count;
}
321

322
/*
 * Count domains under the driver lock, passing 1 as the "active"
 * selector to virDomainObjListNumOfDomains().
 */
static int lxcNumDomains(virConnectPtr conn) {
    lxc_driver_t *drv = conn->privateData;
    int count;

    lxcDriverLock(drv);
    count = virDomainObjListNumOfDomains(&drv->domains, 1);
    lxcDriverUnlock(drv);

    return count;
}

/*
 * Collect the names of inactive domains into @names (capacity
 * @nnames) under the driver lock; returns whatever
 * virDomainObjListGetInactiveNames() returns.
 */
static int lxcListDefinedDomains(virConnectPtr conn,
                                 char **const names, int nnames) {
    lxc_driver_t *drv = conn->privateData;
    int count;

    lxcDriverLock(drv);
    count = virDomainObjListGetInactiveNames(&drv->domains, names, nnames);
    lxcDriverUnlock(drv);

    return count;
}


346
/*
 * Count domains under the driver lock, passing 0 as the "active"
 * selector to virDomainObjListNumOfDomains().
 */
static int lxcNumDefinedDomains(virConnectPtr conn) {
    lxc_driver_t *drv = conn->privateData;
    int count;

    lxcDriverLock(drv);
    count = virDomainObjListNumOfDomains(&drv->domains, 0);
    lxcDriverUnlock(drv);

    return count;
}

357 358


D
Daniel Veillard 已提交
359 360
/*
 * Define a persistent domain from an XML description.
 *
 * The XML is parsed as an inactive definition, checked against the
 * existing domain list, assigned to a domain object and saved to the
 * driver's config directory.  A DEFINED event is queued, with detail
 * ADDED for a new domain or UPDATED when the duplicate check reported
 * an existing one.
 *
 * Returns a domain handle, or NULL on failure.
 */
static virDomainPtr lxcDomainDefine(virConnectPtr conn, const char *xml)
{
    lxc_driver_t *drv = conn->privateData;
    virDomainDefPtr parsed = NULL;
    virDomainObjPtr obj = NULL;
    virDomainPtr handle = NULL;
    virDomainEventPtr ev = NULL;
    int isDup;

    lxcDriverLock(drv);

    parsed = virDomainDefParseString(drv->caps, xml,
                                     VIR_DOMAIN_XML_INACTIVE);
    if (parsed == NULL)
        goto cleanup;

    isDup = virDomainObjIsDuplicate(&drv->domains, parsed, 0);
    if (isDup < 0)
        goto cleanup;

    /* interfaces were requested but the driver has no NETNS support */
    if (parsed->nets != NULL && !drv->have_netns) {
        lxcError(VIR_ERR_NO_SUPPORT,
                 "%s", _("System lacks NETNS support"));
        goto cleanup;
    }

    obj = virDomainAssignDef(drv->caps, &drv->domains, parsed);
    if (obj == NULL)
        goto cleanup;
    /* cleared so the cleanup path does not free the assigned definition */
    parsed = NULL;
    obj->persistent = 1;

    if (virDomainSaveConfig(drv->configDir,
                            obj->newDef ? obj->newDef : obj->def) < 0) {
        virDomainRemoveInactive(&drv->domains, obj);
        obj = NULL;
        goto cleanup;
    }

    ev = virDomainEventNewFromObj(obj,
                                  VIR_DOMAIN_EVENT_DEFINED,
                                  isDup ?
                                  VIR_DOMAIN_EVENT_DEFINED_UPDATED :
                                  VIR_DOMAIN_EVENT_DEFINED_ADDED);

    handle = virGetDomain(conn, obj->def->name, obj->def->uuid);
    if (handle != NULL)
        handle->id = obj->def->id;

cleanup:
    virDomainDefFree(parsed);
    if (obj != NULL)
        virDomainObjUnlock(obj);
    if (ev != NULL)
        lxcDomainEventQueue(drv, ev);
    lxcDriverUnlock(drv);
    return handle;
}

/*
 * Undefine an inactive, persistent domain: delete its configuration,
 * queue an UNDEFINED/REMOVED event and remove it from the domain list.
 *
 * Returns 0 on success, -1 if the domain is unknown, active,
 * transient, or its configuration could not be deleted.
 */
static int lxcDomainUndefine(virDomainPtr dom)
{
    lxc_driver_t *drv = dom->conn->privateData;
    virDomainObjPtr obj;
    virDomainEventPtr ev = NULL;
    int rv = -1;

    lxcDriverLock(drv);

    obj = virDomainFindByUUID(&drv->domains, dom->uuid);
    if (obj == NULL) {
        lxcError(VIR_ERR_INVALID_DOMAIN,
                 "%s", _("No domain with matching uuid"));
        goto cleanup;
    }

    if (virDomainObjIsActive(obj)) {
        lxcError(VIR_ERR_OPERATION_INVALID,
                 "%s", _("Cannot delete active domain"));
        goto cleanup;
    }

    if (!obj->persistent) {
        lxcError(VIR_ERR_OPERATION_INVALID,
                 "%s", _("Cannot undefine transient domain"));
        goto cleanup;
    }

    if (virDomainDeleteConfig(drv->configDir,
                              drv->autostartDir,
                              obj) < 0)
        goto cleanup;

    /* the event is built while the object is still in the list */
    ev = virDomainEventNewFromObj(obj,
                                  VIR_DOMAIN_EVENT_UNDEFINED,
                                  VIR_DOMAIN_EVENT_UNDEFINED_REMOVED);

    virDomainRemoveInactive(&drv->domains, obj);
    obj = NULL;
    rv = 0;

cleanup:
    if (obj != NULL)
        virDomainObjUnlock(obj);
    if (ev != NULL)
        lxcDomainEventQueue(drv, ev);
    lxcDriverUnlock(drv);
    return rv;
}

/*
 * Fill @info for the domain identified by dom->uuid.
 *
 * For an active domain with a driver cgroup available, CPU time and
 * memory usage are read from the domain's cgroup; otherwise CPU time
 * is 0 and memory comes from the definition.  The number of virtual
 * CPUs is always reported as 1.
 *
 * Returns 0 on success, -1 on failure.
 */
static int lxcDomainGetInfo(virDomainPtr dom,
                            virDomainInfoPtr info)
{
    lxc_driver_t *drv = dom->conn->privateData;
    virDomainObjPtr obj;
    virCgroupPtr grp = NULL;
    int rv = -1;

    lxcDriverLock(drv);
    obj = virDomainFindByUUID(&drv->domains, dom->uuid);

    if (obj == NULL) {
        lxcError(VIR_ERR_INVALID_DOMAIN,
                 "%s", _("No domain with matching uuid"));
        goto cleanup;
    }

    info->state = obj->state;

    if (virDomainObjIsActive(obj) && drv->cgroup != NULL) {
        if (virCgroupForDomain(drv->cgroup, obj->def->name, &grp, 0) != 0) {
            lxcError(VIR_ERR_INTERNAL_ERROR,
                     _("Unable to get cgroup for %s"), obj->def->name);
            goto cleanup;
        }

        if (virCgroupGetCpuacctUsage(grp, &(info->cpuTime)) < 0) {
            lxcError(VIR_ERR_OPERATION_FAILED,
                     "%s", _("Cannot read cputime for domain"));
            goto cleanup;
        }
        if (virCgroupGetMemoryUsage(grp, &(info->memory)) < 0) {
            lxcError(VIR_ERR_OPERATION_FAILED,
                     "%s", _("Cannot read memory usage for domain"));
            goto cleanup;
        }
    } else {
        /* no live accounting available: fall back to the definition */
        info->cpuTime = 0;
        info->memory = obj->def->memory;
    }

    info->maxMem = obj->def->maxmem;
    info->nrVirtCpu = 1;
    rv = 0;

cleanup:
    lxcDriverUnlock(drv);
    if (grp != NULL)
        virCgroupFree(&grp);
    if (obj != NULL)
        virDomainObjUnlock(obj);
    return rv;
}

518
/*
 * Return a newly allocated copy of the domain's OS type string, or
 * NULL if the domain is unknown or the copy could not be allocated.
 */
static char *lxcGetOSType(virDomainPtr dom)
{
    lxc_driver_t *drv = dom->conn->privateData;
    virDomainObjPtr obj;
    char *ostype;

    lxcDriverLock(drv);
    obj = virDomainFindByUUID(&drv->domains, dom->uuid);
    lxcDriverUnlock(drv);

    if (obj == NULL) {
        lxcError(VIR_ERR_INVALID_DOMAIN,
                 "%s", _("No domain with matching uuid"));
        return NULL;
    }

    ostype = strdup(obj->def->os.type);
    if (ostype == NULL)
        virReportOOMError();

    virDomainObjUnlock(obj);
    return ostype;
}

R
Ryota Ozaki 已提交
545 546 547 548 549 550 551 552 553 554 555 556 557
/*
 * Return the maxmem value from the domain definition, or 0 if the
 * domain is unknown (VIR_ERR_NO_DOMAIN is reported).
 */
static unsigned long lxcDomainGetMaxMemory(virDomainPtr dom) {
    lxc_driver_t *drv = dom->conn->privateData;
    virDomainObjPtr obj;
    unsigned long maxmem;

    lxcDriverLock(drv);
    obj = virDomainFindByUUID(&drv->domains, dom->uuid);
    lxcDriverUnlock(drv);

    if (obj == NULL) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];

        virUUIDFormat(dom->uuid, uuidstr);
        lxcError(VIR_ERR_NO_DOMAIN,
                 _("No domain with matching uuid '%s'"), uuidstr);
        return 0;
    }

    maxmem = obj->def->maxmem;
    virDomainObjUnlock(obj);

    return maxmem;
}

/*
 * Store @newmax as the domain definition's maxmem.  The new maximum
 * may not be lower than the definition's current memory value.
 *
 * Returns 0 on success, -1 if the domain is unknown or @newmax is
 * too small.
 */
static int lxcDomainSetMaxMemory(virDomainPtr dom, unsigned long newmax) {
    lxc_driver_t *drv = dom->conn->privateData;
    virDomainObjPtr obj;
    int rv = -1;

    lxcDriverLock(drv);
    obj = virDomainFindByUUID(&drv->domains, dom->uuid);
    lxcDriverUnlock(drv);

    if (obj == NULL) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];

        virUUIDFormat(dom->uuid, uuidstr);
        lxcError(VIR_ERR_NO_DOMAIN,
                 _("No domain with matching uuid '%s'"), uuidstr);
        return -1;
    }

    if (newmax >= obj->def->memory) {
        obj->def->maxmem = newmax;
        rv = 0;
    } else {
        lxcError(VIR_ERR_INVALID_ARG,
                 "%s", _("Cannot set max memory lower than current memory"));
    }

    virDomainObjUnlock(obj);
    return rv;
}

/*
 * Set the memory of a domain to @newmem, which may not exceed the
 * definition's maxmem.
 *
 * For an active domain the value is applied through the domain's
 * cgroup, which requires the driver to have a cgroup; for an inactive
 * domain it is stored in the definition.
 *
 * Returns 0 on success, -1 on failure.
 */
static int lxcDomainSetMemory(virDomainPtr dom, unsigned long newmem) {
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    virCgroupPtr cgroup = NULL;
    int ret = -1;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    lxcDriverUnlock(driver);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        lxcError(VIR_ERR_NO_DOMAIN,
                 _("No domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    if (newmem > vm->def->maxmem) {
        lxcError(VIR_ERR_INVALID_ARG,
                 "%s", _("Cannot set memory higher than max memory"));
        goto cleanup;
    }

    if (virDomainObjIsActive(vm)) {
        /* lxcDomainGetInfo treats a NULL driver cgroup as "no cgroup
         * support"; refuse explicitly here instead of handing NULL to
         * the cgroup lookup. */
        if (driver->cgroup == NULL) {
            lxcError(VIR_ERR_NO_SUPPORT,
                     "%s", _("cgroups must be configured on the host"));
            goto cleanup;
        }

        if (virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) != 0) {
            /* no trailing newline: matches the same message in
             * lxcDomainGetInfo */
            lxcError(VIR_ERR_INTERNAL_ERROR,
                     _("Unable to get cgroup for %s"), vm->def->name);
            goto cleanup;
        }

        if (virCgroupSetMemory(cgroup, newmem) < 0) {
            lxcError(VIR_ERR_OPERATION_FAILED,
                     "%s", _("Failed to set memory for domain"));
            goto cleanup;
        }
    } else {
        vm->def->memory = newmem;
    }
    ret = 0;

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    if (cgroup)
        virCgroupFree(&cgroup);
    return ret;
}

D
Daniel Veillard 已提交
651
/*
 * Format the domain definition as XML.  When @flags contains
 * VIR_DOMAIN_XML_INACTIVE and the domain has a pending new
 * definition, that definition is formatted instead of the current one.
 *
 * Returns the result of virDomainDefFormat(), or NULL if the domain
 * is unknown.
 */
static char *lxcDomainDumpXML(virDomainPtr dom,
                              int flags)
{
    lxc_driver_t *drv = dom->conn->privateData;
    virDomainObjPtr obj;
    virDomainDefPtr which;
    char *xml;

    lxcDriverLock(drv);
    obj = virDomainFindByUUID(&drv->domains, dom->uuid);
    lxcDriverUnlock(drv);

    if (obj == NULL) {
        lxcError(VIR_ERR_INVALID_DOMAIN,
                 "%s", _("No domain with matching uuid"));
        return NULL;
    }

    which = obj->def;
    if ((flags & VIR_DOMAIN_XML_INACTIVE) && obj->newDef)
        which = obj->newDef;

    xml = virDomainDefFormat(which, flags);

    virDomainObjUnlock(obj);
    return xml;
}

678 679 680

/**
 * lxcVmCleanup:
681 682 683
 * @conn: pointer to connection
 * @driver: pointer to driver structure
 * @vm: pointer to VM to clean up
684 685 686 687 688 689 690
 *
 * waitpid() on the container process.  kill and wait the tty process
 * This is called by both lxcDomainDestroy and lxcSigHandler when a
 * container exits.
 *
 * Returns 0 on success or -1 in case of error
 */
691
static int lxcVmCleanup(lxc_driver_t *driver,
692
                        virDomainObjPtr  vm)
693 694 695 696
{
    int rc = -1;
    int waitRc;
    int childStatus = -1;
D
Dan Smith 已提交
697
    virCgroupPtr cgroup;
698
    int i;
699
    lxcDomainObjPrivatePtr priv = vm->privateData;
700 701 702 703 704 705

    while (((waitRc = waitpid(vm->pid, &childStatus, 0)) == -1) &&
           errno == EINTR)
        ; /* empty */

    if ((waitRc != vm->pid) && (errno != ECHILD)) {
706
        virReportSystemError(errno,
707 708
                             _("waitpid failed to wait for container %d: %d"),
                             vm->pid, waitRc);
709 710 711 712 713 714 715 716 717
    }

    rc = 0;

    if (WIFEXITED(childStatus)) {
        rc = WEXITSTATUS(childStatus);
        DEBUG("container exited with rc: %d", rc);
    }

718 719
    virEventRemoveHandle(priv->monitorWatch);
    close(priv->monitor);
720 721

    virFileDeletePid(driver->stateDir, vm->def->name);
722
    virDomainDeleteConfig(driver->stateDir, NULL, vm);
723 724 725 726

    vm->state = VIR_DOMAIN_SHUTOFF;
    vm->pid = -1;
    vm->def->id = -1;
727 728
    priv->monitor = -1;
    priv->monitorWatch = -1;
729

730 731 732
    for (i = 0 ; i < vm->def->nnets ; i++) {
        vethInterfaceUpOrDown(vm->def->nets[i]->ifname, 0);
        vethDelete(vm->def->nets[i]->ifname);
733 734
    }

735 736
    if (driver->cgroup &&
        virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) == 0) {
D
Dan Smith 已提交
737 738 739 740
        virCgroupRemove(cgroup);
        virCgroupFree(&cgroup);
    }

741 742 743 744 745 746 747
    if (vm->newDef) {
        virDomainDefFree(vm->def);
        vm->def = vm->newDef;
        vm->def->id = -1;
        vm->newDef = NULL;
    }

748 749 750
    return rc;
}

751 752
/**
 * lxcSetupInterfaces:
753
 * @conn: pointer to connection
754
 * @def: pointer to virtual machine structure
755 756
 * @nveths: number of interfaces
 * @veths: interface names
757 758 759 760 761 762 763 764
 *
 * Sets up the container interfaces by creating the veth device pairs and
 * attaching the parent end to the appropriate bridge.  The container end
 * will moved into the container namespace later after clone has been called.
 *
 * Returns 0 on success or -1 in case of error
 */
static int lxcSetupInterfaces(virConnectPtr conn,
765
                              virDomainDefPtr def,
766 767
                              unsigned int *nveths,
                              char ***veths)
768
{
769
    int rc = -1, i;
770
    char *bridge = NULL;
771 772
    char parentVeth[PATH_MAX] = "";
    char containerVeth[PATH_MAX] = "";
773
    brControl *brctl = NULL;
774

775
    if (brInit(&brctl) != 0)
776 777
        return -1;

778 779
    for (i = 0 ; i < def->nnets ; i++) {
        switch (def->nets[i]->type) {
780 781 782
        case VIR_DOMAIN_NET_TYPE_NETWORK:
        {
            virNetworkPtr network = virNetworkLookupByName(conn,
783
                                                           def->nets[i]->data.network.name);
784 785 786 787 788 789 790
            if (!network) {
                goto error_exit;
            }

            bridge = virNetworkGetBridgeName(network);

            virNetworkFree(network);
791 792 793
            break;
        }
        case VIR_DOMAIN_NET_TYPE_BRIDGE:
794
            bridge = def->nets[i]->data.bridge.brname;
795
            break;
796 797 798 799
        }

        DEBUG("bridge: %s", bridge);
        if (NULL == bridge) {
800
            lxcError(VIR_ERR_INTERNAL_ERROR,
801
                     "%s", _("Failed to get bridge for interface"));
802 803 804 805
            goto error_exit;
        }

        DEBUG0("calling vethCreate()");
806 807
        if (NULL != def->nets[i]->ifname) {
            strcpy(parentVeth, def->nets[i]->ifname);
808 809 810
        }
        DEBUG("parentVeth: %s, containerVeth: %s", parentVeth, containerVeth);
        if (0 != (rc = vethCreate(parentVeth, PATH_MAX, containerVeth, PATH_MAX))) {
811
            lxcError(VIR_ERR_INTERNAL_ERROR,
812
                     _("Failed to create veth device pair: %d"), rc);
813 814
            goto error_exit;
        }
815 816
        if (NULL == def->nets[i]->ifname) {
            def->nets[i]->ifname = strdup(parentVeth);
817
        }
818
        if (VIR_REALLOC_N(*veths, (*nveths)+1) < 0) {
819
            virReportOOMError();
820
            goto error_exit;
821 822
        }
        if (((*veths)[(*nveths)] = strdup(containerVeth)) == NULL) {
823
            virReportOOMError();
824
            goto error_exit;
825 826
        }
        (*nveths)++;
827

828
        if (NULL == def->nets[i]->ifname) {
829
            virReportOOMError();
830 831 832
            goto error_exit;
        }

833
        {
834 835 836
            char macaddr[VIR_MAC_STRING_BUFLEN];
            virFormatMacAddr(def->nets[i]->mac, macaddr);
            if (0 != (rc = setMacAddr(containerVeth, macaddr))) {
837
                virReportSystemError(rc,
838
                                     _("Failed to set %s to %s"),
839 840 841 842 843
                                     macaddr, containerVeth);
                goto error_exit;
            }
        }

844
        if (0 != (rc = brAddInterface(brctl, bridge, parentVeth))) {
845
            virReportSystemError(rc,
846
                                 _("Failed to add %s device to %s"),
847
                                 parentVeth, bridge);
848 849 850 851
            goto error_exit;
        }

        if (0 != (rc = vethInterfaceUpOrDown(parentVeth, 1))) {
852
            virReportSystemError(rc,
853 854
                                 _("Failed to enable %s device"),
                                 parentVeth);
855 856 857 858 859 860 861 862
            goto error_exit;
        }

    }

    rc = 0;

error_exit:
863
    brShutdown(brctl);
864 865 866
    return rc;
}

867

868
static int lxcMonitorClient(lxc_driver_t * driver,
869
                            virDomainObjPtr vm)
870
{
871 872 873
    char *sockpath = NULL;
    int fd;
    struct sockaddr_un addr;
874

875 876
    if (virAsprintf(&sockpath, "%s/%s.sock",
                    driver->stateDir, vm->def->name) < 0) {
877
        virReportOOMError();
878 879 880 881
        return -1;
    }

    if ((fd = socket(PF_UNIX, SOCK_STREAM, 0)) < 0) {
882
        virReportSystemError(errno, "%s",
883
                             _("Failed to create client socket"));
884
        goto error;
885 886
    }

887 888
    memset(&addr, 0, sizeof(addr));
    addr.sun_family = AF_UNIX;
C
Chris Lalancette 已提交
889
    if (virStrcpyStatic(addr.sun_path, sockpath) == NULL) {
890
        lxcError(VIR_ERR_INTERNAL_ERROR,
C
Chris Lalancette 已提交
891 892 893
                 _("Socket path %s too big for destination"), sockpath);
        goto error;
    }
894 895

    if (connect(fd, (struct sockaddr *) &addr, sizeof(addr)) < 0) {
896
        virReportSystemError(errno, "%s",
897
                             _("Failed to connect to client socket"));
898
        goto error;
899 900
    }

901 902
    VIR_FREE(sockpath);
    return fd;
903

904 905 906 907 908 909 910 911
error:
    VIR_FREE(sockpath);
    if (fd != -1)
        close(fd);
    return -1;
}


912
static int lxcVmTerminate(lxc_driver_t *driver,
913
                          virDomainObjPtr vm,
914 915 916 917
                          int signum)
{
    if (signum == 0)
        signum = SIGINT;
918

919
    if (vm->pid <= 0) {
920
        lxcError(VIR_ERR_INTERNAL_ERROR,
921
                 _("Invalid PID %d for container"), vm->pid);
922 923 924
        return -1;
    }

925 926
    if (kill(vm->pid, signum) < 0) {
        if (errno != ESRCH) {
927
            virReportSystemError(errno,
928
                                 _("Failed to kill pid %d"),
929
                                 vm->pid);
930
            return -1;
931
        }
932 933
    }

934
    vm->state = VIR_DOMAIN_SHUTDOWN;
935

936
    return lxcVmCleanup(driver, vm);
937
}
938

939 940
static void lxcMonitorEvent(int watch,
                            int fd,
941 942 943
                            int events ATTRIBUTE_UNUSED,
                            void *data)
{
944 945
    lxc_driver_t *driver = lxc_driver;
    virDomainObjPtr vm = data;
946
    virDomainEventPtr event = NULL;
947
    lxcDomainObjPrivatePtr priv;
948

949
    lxcDriverLock(driver);
950 951
    virDomainObjLock(vm);
    lxcDriverUnlock(driver);
952

953 954 955
    priv = vm->privateData;

    if (priv->monitor != fd || priv->monitorWatch != watch) {
956
        virEventRemoveHandle(watch);
957
        goto cleanup;
958 959
    }

960
    if (lxcVmTerminate(driver, vm, SIGINT) < 0) {
961
        virEventRemoveHandle(watch);
962 963 964 965 966
    } else {
        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_STOPPED,
                                         VIR_DOMAIN_EVENT_STOPPED_SHUTDOWN);
    }
967 968 969 970
    if (!vm->persistent) {
        virDomainRemoveInactive(&driver->domains, vm);
        vm = NULL;
    }
971 972

cleanup:
973 974
    if (vm)
        virDomainObjUnlock(vm);
975 976
    if (event) {
        lxcDriverLock(driver);
977
        lxcDomainEventQueue(driver, event);
978 979
        lxcDriverUnlock(driver);
    }
980 981 982
}


983
static int lxcControllerStart(lxc_driver_t *driver,
984 985 986 987 988 989 990 991 992 993
                              virDomainObjPtr vm,
                              int nveths,
                              char **veths,
                              int appPty,
                              int logfd)
{
    int i;
    int rc;
    int largc = 0, larga = 0;
    const char **largv = NULL;
A
Amy Griffis 已提交
994 995 996 997 998
    int lenvc = 0, lenva = 0;
    const char **lenv = NULL;
    char *filterstr;
    char *outputstr;
    char *tmp;
A
Amy Griffis 已提交
999
    int log_level;
1000 1001
    pid_t child;
    int status;
1002 1003
    fd_set keepfd;
    char appPtyStr[30];
1004
    const char *emulator;
1005 1006

    FD_ZERO(&keepfd);
1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 1024 1025 1026 1027 1028 1029

#define ADD_ARG_SPACE                                                   \
    do { \
        if (largc == larga) {                                           \
            larga += 10;                                                \
            if (VIR_REALLOC_N(largv, larga) < 0)                        \
                goto no_memory;                                         \
        }                                                               \
    } while (0)

#define ADD_ARG(thisarg)                                                \
    do {                                                                \
        ADD_ARG_SPACE;                                                  \
        largv[largc++] = thisarg;                                       \
    } while (0)

#define ADD_ARG_LIT(thisarg)                                            \
    do {                                                                \
        ADD_ARG_SPACE;                                                  \
        if ((largv[largc++] = strdup(thisarg)) == NULL)                 \
            goto no_memory;                                             \
    } while (0)

A
Amy Griffis 已提交
1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 1051 1052 1053
#define ADD_ENV_SPACE                                                   \
    do {                                                                \
        if (lenvc == lenva) {                                           \
            lenva += 10;                                                \
            if (VIR_REALLOC_N(lenv, lenva) < 0)                         \
                goto no_memory;                                         \
        }                                                               \
    } while (0)

#define ADD_ENV(thisarg)                                                \
    do {                                                                \
        ADD_ENV_SPACE;                                                  \
        lenv[lenvc++] = thisarg;                                        \
    } while (0)

#define ADD_ENV_PAIR(envname, val)                                      \
    do {                                                                \
        char *envval;                                                   \
        ADD_ENV_SPACE;                                                  \
        if (virAsprintf(&envval, "%s=%s", envname, val) < 0)            \
            goto no_memory;                                             \
        lenv[lenvc++] = envval;                                         \
    } while (0)

1054 1055 1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 1066
#define ADD_ENV_COPY(envname)                                           \
    do {                                                                \
        char *val = getenv(envname);                                    \
        if (val != NULL) {                                              \
            ADD_ENV_PAIR(envname, val);                                 \
        }                                                               \
    } while (0)

    /*
     * The controller may call ip command, so we have to remain PATH.
     */
    ADD_ENV_COPY("PATH");

A
Amy Griffis 已提交
1067 1068
    log_level = virLogGetDefaultPriority();
    if (virAsprintf(&tmp, "LIBVIRT_DEBUG=%d", log_level) < 0)
A
Amy Griffis 已提交
1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079
        goto no_memory;
    ADD_ENV(tmp);

    if (virLogGetNbFilters() > 0) {
        filterstr = virLogGetFilters();
        if (!filterstr)
            goto no_memory;
        ADD_ENV_PAIR("LIBVIRT_LOG_FILTERS", filterstr);
        VIR_FREE(filterstr);
    }

A
Amy Griffis 已提交
1080 1081 1082 1083 1084 1085 1086 1087 1088 1089
    if (driver->log_libvirtd) {
        if (virLogGetNbOutputs() > 0) {
            outputstr = virLogGetOutputs();
            if (!outputstr)
                goto no_memory;
            ADD_ENV_PAIR("LIBVIRT_LOG_OUTPUTS", outputstr);
            VIR_FREE(outputstr);
        }
    } else {
        if (virAsprintf(&tmp, "LIBVIRT_LOG_OUTPUTS=%d:stderr", log_level) < 0)
A
Amy Griffis 已提交
1090
            goto no_memory;
A
Amy Griffis 已提交
1091
        ADD_ENV(tmp);
A
Amy Griffis 已提交
1092 1093 1094 1095
    }

    ADD_ENV(NULL);

1096 1097
    snprintf(appPtyStr, sizeof(appPtyStr), "%d", appPty);

1098 1099 1100
    emulator = vm->def->emulator;

    ADD_ARG_LIT(emulator);
1101 1102 1103
    ADD_ARG_LIT("--name");
    ADD_ARG_LIT(vm->def->name);
    ADD_ARG_LIT("--console");
1104
    ADD_ARG_LIT(appPtyStr);
1105 1106 1107 1108 1109 1110 1111 1112 1113
    ADD_ARG_LIT("--background");

    for (i = 0 ; i < nveths ; i++) {
        ADD_ARG_LIT("--veth");
        ADD_ARG_LIT(veths[i]);
    }

    ADD_ARG(NULL);

1114 1115
    FD_SET(appPty, &keepfd);

1116
    if (virExec(largv, lenv, &keepfd, &child,
1117
                -1, &logfd, &logfd,
1118 1119 1120 1121 1122 1123 1124 1125 1126
                VIR_EXEC_NONE) < 0)
        goto cleanup;

    /* We now wait for the process to exit - the controller
     * will fork() itself into the background - waiting for
     * it to exit thus guarentees it has written its pidfile
     */
    while ((rc = waitpid(child, &status, 0) == -1) && errno == EINTR);
    if (rc == -1) {
1127
        virReportSystemError(errno,
1128
                             _("Cannot wait for '%s'"),
1129
                             largv[0]);
1130 1131 1132 1133
        goto cleanup;
    }

    if (!(WIFEXITED(status) && WEXITSTATUS(status) == 0)) {
1134
        lxcError(VIR_ERR_INTERNAL_ERROR,
1135
                 _("Container '%s' unexpectedly shutdown during startup"),
1136 1137 1138 1139 1140 1141 1142
                 largv[0]);
        goto cleanup;
    }

#undef ADD_ARG
#undef ADD_ARG_LIT
#undef ADD_ARG_SPACE
A
Amy Griffis 已提交
1143 1144
#undef ADD_ENV_SPACE
#undef ADD_ENV_PAIR
1145

A
Amy Griffis 已提交
1146
    return 0;
1147 1148

no_memory:
1149
    virReportOOMError();
A
Amy Griffis 已提交
1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161
cleanup:
    if (largv) {
        for (i = 0 ; i < largc ; i++)
            VIR_FREE(largv[i]);
        VIR_FREE(largv);
    }
    if (lenv) {
        for (i=0 ; i < lenvc ; i++)
            VIR_FREE(lenv[i]);
        VIR_FREE(lenv);
    }
    return -1;
1162 1163 1164
}


1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176
/**
 * lxcVmStart:
 * @conn: pointer to connection
 * @driver: pointer to driver structure
 * @vm: pointer to virtual machine structure
 *
 * Starts a vm
 *
 * Returns 0 on success or -1 in case of error
 */
static int lxcVmStart(virConnectPtr conn,
                      lxc_driver_t * driver,
1177
                      virDomainObjPtr  vm)
1178
{
1179
    int rc = -1, r;
1180 1181
    unsigned int i;
    int parentTty;
1182
    char *parentTtyPath = NULL;
1183 1184 1185 1186
    char *logfile = NULL;
    int logfd = -1;
    unsigned int nveths = 0;
    char **veths = NULL;
1187
    lxcDomainObjPrivatePtr priv = vm->privateData;
1188

L
Laine Stump 已提交
1189
    if ((r = virFileMakePath(driver->logDir)) != 0) {
1190
        virReportSystemError(r,
1191
                             _("Cannot create log directory '%s'"),
1192
                             driver->logDir);
1193 1194
        return -1;
    }
1195

1196 1197
    if (virAsprintf(&logfile, "%s/%s.log",
                    driver->logDir, vm->def->name) < 0) {
1198
        virReportOOMError();
1199
        return -1;
1200 1201
    }

1202
    /* open parent tty */
1203
    if (virFileOpenTty(&parentTty, &parentTtyPath, 1) < 0) {
1204
        virReportSystemError(errno, "%s",
1205
                             _("Failed to allocate tty"));
1206 1207
        goto cleanup;
    }
1208 1209 1210 1211 1212 1213 1214
    if (vm->def->console &&
        vm->def->console->type == VIR_DOMAIN_CHR_TYPE_PTY) {
        VIR_FREE(vm->def->console->data.file.path);
        vm->def->console->data.file.path = parentTtyPath;
    } else {
        VIR_FREE(parentTtyPath);
    }
1215

1216
    if (lxcSetupInterfaces(conn, vm->def, &nveths, &veths) != 0)
1217
        goto cleanup;
1218

1219
    /* Persist the live configuration now we have veth & tty info */
1220
    if (virDomainSaveConfig(driver->stateDir, vm->def) < 0)
1221 1222
        goto cleanup;

1223
    if ((logfd = open(logfile, O_WRONLY | O_APPEND | O_CREAT,
1224
             S_IRUSR|S_IWUSR)) < 0) {
1225
        virReportSystemError(errno,
1226
                             _("Failed to open '%s'"),
1227
                             logfile);
1228
        goto cleanup;
1229 1230
    }

1231
    if (lxcControllerStart(driver,
1232 1233 1234
                           vm,
                           nveths, veths,
                           parentTty, logfd) < 0)
1235
        goto cleanup;
1236 1237 1238 1239

    /* Connect to the controller as a client *first* because
     * this will block until the child has written their
     * pid file out to disk */
1240
    if ((priv->monitor = lxcMonitorClient(driver, vm)) < 0)
1241 1242
        goto cleanup;

1243
    /* And get its pid */
1244
    if ((r = virFileReadPid(driver->stateDir, vm->def->name, &vm->pid)) != 0) {
1245
        virReportSystemError(r,
1246 1247
                             _("Failed to read pid file %s/%s.pid"),
                             driver->stateDir, vm->def->name);
1248
        goto cleanup;
1249
    }
1250

1251
    vm->def->id = vm->pid;
1252 1253
    vm->state = VIR_DOMAIN_RUNNING;

1254 1255
    if ((priv->monitorWatch = virEventAddHandle(
             priv->monitor,
1256 1257
             VIR_EVENT_HANDLE_ERROR | VIR_EVENT_HANDLE_HANGUP,
             lxcMonitorEvent,
1258
             vm, NULL)) < 0) {
1259
        lxcVmTerminate(driver, vm, 0);
1260 1261
        goto cleanup;
    }
1262

1263 1264 1265 1266 1267 1268 1269 1270
    rc = 0;

cleanup:
    for (i = 0 ; i < nveths ; i++) {
        if (rc != 0)
            vethDelete(veths[i]);
        VIR_FREE(veths[i]);
    }
1271 1272 1273
    if (rc != 0 && priv->monitor != -1) {
        close(priv->monitor);
        priv->monitor = -1;
1274 1275 1276 1277 1278 1279
    }
    if (parentTty != -1)
        close(parentTty);
    if (logfd != -1)
        close(logfd);
    VIR_FREE(logfile);
1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292
    return rc;
}

/**
 * lxcDomainStart:
 * @dom: domain to start
 *
 * Looks up the domain by name and starts it. Starting is refused when
 * the domain is already active or when it defines network interfaces
 * and the driver found no NETNS support. A "started" event is queued
 * on success.
 *
 * Returns 0 on success or -1 in case of error
 */
static int lxcDomainStart(virDomainPtr dom)
{
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    virDomainEventPtr event = NULL;
    int ret = -1;

    lxcDriverLock(driver);
    vm = virDomainFindByName(&driver->domains, dom->name);
    if (!vm) {
        lxcError(VIR_ERR_INVALID_DOMAIN,
                 _("No domain named %s"), dom->name);
        goto cleanup;
    }

    if ((vm->def->nets != NULL) && !(driver->have_netns)) {
        lxcError(VIR_ERR_NO_SUPPORT,
                 "%s", _("System lacks NETNS support"));
        goto cleanup;
    }

    /* Starting a domain that is already running would launch a second
     * controller and overwrite the monitor/pid of the first one. */
    if (virDomainObjIsActive(vm)) {
        lxcError(VIR_ERR_OPERATION_INVALID,
                 "%s", _("Domain is already running"));
        goto cleanup;
    }

    ret = lxcVmStart(dom->conn, driver, vm);

    if (ret == 0)
        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_STARTED,
                                         VIR_DOMAIN_EVENT_STARTED_BOOTED);

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    if (event)
        lxcDomainEventQueue(driver, event);
    lxcDriverUnlock(driver);
    return ret;
}

/**
 * lxcDomainCreateAndStart:
 * @conn: pointer to connection
 * @xml: XML definition of domain
 * @flags: Unused
 *
 * Parses @xml into a domain definition, registers it with the driver
 * and starts it. A "started" event is queued once the domain is up.
 *
 * Returns the new domain object on success or NULL in case of error
 */
static virDomainPtr
lxcDomainCreateAndStart(virConnectPtr conn,
                        const char *xml,
                        unsigned int flags ATTRIBUTE_UNUSED) {
    lxc_driver_t *driver = conn->privateData;
    virDomainObjPtr vm = NULL;
    virDomainDefPtr def;
    virDomainPtr result = NULL;
    virDomainEventPtr startedEvent = NULL;

    lxcDriverLock(driver);

    def = virDomainDefParseString(driver->caps, xml,
                                  VIR_DOMAIN_XML_INACTIVE);
    if (def == NULL)
        goto cleanup;

    if (virDomainObjIsDuplicate(&driver->domains, def, 1) < 0)
        goto cleanup;

    /* Network interfaces need NETNS support */
    if (def->nets != NULL && !driver->have_netns) {
        lxcError(VIR_ERR_NO_SUPPORT,
                 "%s", _("System lacks NETNS support"));
        goto cleanup;
    }

    vm = virDomainAssignDef(driver->caps, &driver->domains, def);
    if (vm == NULL)
        goto cleanup;
    /* Cleared so the virDomainDefFree() in cleanup leaves the
     * definition just assigned to the domain untouched */
    def = NULL;

    if (lxcVmStart(conn, driver, vm) < 0) {
        virDomainRemoveInactive(&driver->domains, vm);
        vm = NULL;
        goto cleanup;
    }

    startedEvent = virDomainEventNewFromObj(vm,
                                            VIR_DOMAIN_EVENT_STARTED,
                                            VIR_DOMAIN_EVENT_STARTED_BOOTED);

    result = virGetDomain(conn, vm->def->name, vm->def->uuid);
    if (result != NULL)
        result->id = vm->def->id;

cleanup:
    virDomainDefFree(def);
    if (vm != NULL)
        virDomainObjUnlock(vm);
    if (startedEvent != NULL)
        lxcDomainEventQueue(driver, startedEvent);
    lxcDriverUnlock(driver);
    return result;
}

/**
 * lxcDomainShutdown:
 * @dom: pointer to domain to shutdown
 *
 * Looks the domain up by id and asks lxcVmTerminate() to stop it,
 * passing 0 as the signal argument.
 * NOTE(review): presumably lxcVmTerminate() maps 0 to its default
 * shutdown signal (SIGINT) - confirm against its definition.
 * A "stopped/shutdown" event is queued and a non-persistent domain is
 * removed from the driver's list.
 *
 * Returns 0 on success or -1 in case of error
 */
static int lxcDomainShutdown(virDomainPtr dom)
{
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainEventPtr stopEvent = NULL;
    virDomainObjPtr vm;
    int rc = -1;

    lxcDriverLock(driver);

    vm = virDomainFindByID(&driver->domains, dom->id);
    if (vm == NULL) {
        lxcError(VIR_ERR_INVALID_DOMAIN,
                 _("No domain with id %d"), dom->id);
        goto cleanup;
    }

    rc = lxcVmTerminate(driver, vm, 0);
    stopEvent = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_STOPPED,
                                         VIR_DOMAIN_EVENT_STOPPED_SHUTDOWN);

    /* Transient domains disappear once stopped */
    if (!vm->persistent) {
        virDomainRemoveInactive(&driver->domains, vm);
        vm = NULL;
    }

cleanup:
    if (vm != NULL)
        virDomainObjUnlock(vm);
    if (stopEvent != NULL)
        lxcDomainEventQueue(driver, stopEvent);
    lxcDriverUnlock(driver);
    return rc;
}


/*
 * Adds @callback (with its @opaque data and @freecb) to the driver's
 * list of domain event callbacks while holding the driver lock.
 * Returns whatever virDomainEventCallbackListAdd() returns.
 */
static int
lxcDomainEventRegister (virConnectPtr conn,
                        virConnectDomainEventCallback callback,
                        void *opaque,
                        virFreeCallback freecb)
{
    lxc_driver_t *driver = conn->privateData;
    int rc;

    lxcDriverLock(driver);
    rc = virDomainEventCallbackListAdd(conn,
                                       driver->domainEventCallbacks,
                                       callback,
                                       opaque,
                                       freecb);
    lxcDriverUnlock(driver);

    return rc;
}

1451 1452 1453 1454 1455 1456 1457 1458 1459 1460 1461 1462 1463 1464 1465 1466 1467 1468 1469 1470 1471 1472 1473 1474 1475 1476 1477 1478 1479 1480 1481 1482 1483 1484 1485 1486 1487 1488 1489 1490 1491 1492 1493 1494 1495 1496 1497 1498 1499 1500 1501 1502 1503 1504 1505 1506 1507 1508 1509 1510 1511 1512 1513 1514 1515 1516 1517 1518 1519 1520 1521 1522 1523
/*
 * Removes @callback from the driver's domain event callback list.
 * While events are being dispatched the entry is only marked for
 * deletion; otherwise it is removed immediately.
 */
static int
lxcDomainEventDeregister (virConnectPtr conn,
                          virConnectDomainEventCallback callback)
{
    lxc_driver_t *driver = conn->privateData;
    int rc;

    lxcDriverLock(driver);
    if (!driver->domainEventDispatching) {
        rc = virDomainEventCallbackListRemove(conn,
                                              driver->domainEventCallbacks,
                                              callback);
    } else {
        rc = virDomainEventCallbackListMarkDelete(conn,
                                                  driver->domainEventCallbacks,
                                                  callback);
    }
    lxcDriverUnlock(driver);

    return rc;
}

/*
 * Per-callback dispatch hook: forwards the event to the default
 * dispatcher with the driver lock released. @opaque is the driver.
 */
static void lxcDomainEventDispatchFunc(virConnectPtr conn,
                                       virDomainEventPtr event,
                                       virConnectDomainEventCallback cb,
                                       void *cbopaque,
                                       void *opaque)
{
    lxc_driver_t *drv = opaque;

    /* Drop the lock while dispatching, for sake of re-entrancy */
    lxcDriverUnlock(drv);

    virDomainEventDispatchDefaultFunc(conn, event, cb, cbopaque, NULL);

    lxcDriverLock(drv);
}


/*
 * Timer callback: takes over the driver's pending event queue,
 * disables the timer, dispatches the events to the registered
 * callbacks and finally purges callbacks that were marked for
 * deletion during dispatch. @opaque is the driver.
 */
static void lxcDomainEventFlush(int timer ATTRIBUTE_UNUSED, void *opaque)
{
    lxc_driver_t *drv = opaque;
    virDomainEventQueue pending;

    lxcDriverLock(drv);

    drv->domainEventDispatching = 1;

    /* Move the queued events into a local queue, so we're reentrant safe */
    pending.events = drv->domainEventQueue->events;
    pending.count = drv->domainEventQueue->count;
    drv->domainEventQueue->events = NULL;
    drv->domainEventQueue->count = 0;

    virEventUpdateTimeout(drv->domainEventTimer, -1);
    virDomainEventQueueDispatch(&pending,
                                drv->domainEventCallbacks,
                                lxcDomainEventDispatchFunc,
                                drv);

    /* Purge any deleted callbacks */
    virDomainEventCallbackListPurgeMarked(drv->domainEventCallbacks);

    drv->domainEventDispatching = 0;

    lxcDriverUnlock(drv);
}


/*
 * Appends @event to @driver's event queue, freeing the event if it
 * cannot be queued. When the queue then holds exactly one event the
 * event timer is updated with a timeout of 0.
 *
 * driver must be locked before calling
 */
static void lxcDomainEventQueue(lxc_driver_t *driver,
                                 virDomainEventPtr event)
{
    if (virDomainEventQueuePush(driver->domainEventQueue,
                                event) < 0)
        virDomainEventFree(event);
    /* Inspect the queue of the driver we were given (and whose timer
     * we update), not the global driver object */
    if (driver->domainEventQueue->count == 1)
        virEventUpdateTimeout(driver->domainEventTimer, 0);
}
1524 1525 1526

/**
 * lxcDomainDestroy:
 * @dom: pointer to domain to destroy
 *
 * Looks the domain up by id and terminates it with SIGKILL. A
 * "stopped/destroyed" event is queued and a non-persistent domain is
 * removed from the driver's list.
 *
 * Returns 0 on success or -1 in case of error
 */
static int lxcDomainDestroy(virDomainPtr dom)
{
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainEventPtr stopEvent = NULL;
    virDomainObjPtr vm;
    int rc = -1;

    lxcDriverLock(driver);

    vm = virDomainFindByID(&driver->domains, dom->id);
    if (vm == NULL) {
        lxcError(VIR_ERR_INVALID_DOMAIN,
                 _("No domain with id %d"), dom->id);
        goto cleanup;
    }

    rc = lxcVmTerminate(driver, vm, SIGKILL);
    stopEvent = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_STOPPED,
                                         VIR_DOMAIN_EVENT_STOPPED_DESTROYED);

    /* Transient domains disappear once stopped */
    if (!vm->persistent) {
        virDomainRemoveInactive(&driver->domains, vm);
        vm = NULL;
    }

cleanup:
    if (vm != NULL)
        virDomainObjUnlock(vm);
    if (stopEvent != NULL)
        lxcDomainEventQueue(driver, stopEvent);
    lxcDriverUnlock(driver);
    return rc;
}
1565

1566 1567 1568 1569 1570
static int lxcCheckNetNsSupport(void)
{
    const char *argv[] = {"ip", "link", "set", "lo", "netns", "-1", NULL};
    int ip_rc;

1571
    if (virRun(argv, &ip_rc) < 0 ||
1572 1573
        !(WIFEXITED(ip_rc) && (WEXITSTATUS(ip_rc) != 255)))
        return 0;
1574

1575 1576
    if (lxcContainerAvailable(LXC_CONTAINER_FEATURE_NET) < 0)
        return 0;
1577

1578
    return 1;
1579 1580
}

1581

1582 1583 1584 1585 1586 1587 1588 1589 1590 1591 1592 1593 1594
/* Context handed to lxcAutostartDomain() through virHashForEach() */
struct lxcAutostartData {
    lxc_driver_t *driver;   /* driver passed to lxcVmStart() and used to queue events */
    virConnectPtr conn;     /* connection passed to lxcVmStart(); may be NULL */
};

/*
 * Hash iterator: starts the domain in @payload when it is flagged for
 * autostart and not already active. @opaque points to a
 * struct lxcAutostartData. A failure is logged; a success queues a
 * "started" event.
 */
static void
lxcAutostartDomain(void *payload, const char *name ATTRIBUTE_UNUSED, void *opaque)
{
    virDomainObjPtr vm = payload;
    const struct lxcAutostartData *data = opaque;

    virDomainObjLock(vm);

    if (!vm->autostart || virDomainObjIsActive(vm))
        goto done;

    if (lxcVmStart(data->conn, data->driver, vm) < 0) {
        virErrorPtr err = virGetLastError();
        VIR_ERROR(_("Failed to autostart VM '%s': %s"),
                  vm->def->name,
                  err ? err->message : "");
    } else {
        virDomainEventPtr startedEvent =
            virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STARTED,
                                     VIR_DOMAIN_EVENT_STARTED_BOOTED);
        if (startedEvent != NULL)
            lxcDomainEventQueue(data->driver, startedEvent);
    }

done:
    virDomainObjUnlock(vm);
}

1614 1615 1616 1617 1618 1619 1620 1621 1622 1623
/*
 * Runs lxcAutostartDomain() over every domain known to @driver while
 * holding the driver lock, using a temporary "lxc:///" connection.
 */
static void
lxcAutostartConfigs(lxc_driver_t *driver) {
    struct lxcAutostartData data;

    /* XXX: Figure out a better way to do this. The domain
     * startup code needs a connection handle in order
     * to lookup the bridge associated with a virtual
     * network
     */
    virConnectPtr conn = virConnectOpen("lxc:///");
    /* Ignoring NULL conn which is mostly harmless here */

    data.driver = driver;
    data.conn = conn;

    lxcDriverLock(driver);
    virHashForEach(driver->domains.objs, lxcAutostartDomain, &data);
    lxcDriverUnlock(driver);

    if (conn != NULL)
        virConnectClose(conn);
}

1634 1635 1636 1637 1638 1639 1640
/*
 * Hash iterator used at driver startup: tries to reconnect to the
 * controller of the domain in @payload. @opaque is the driver.
 *
 * When the monitor connection and pid file are available, the saved
 * live configuration is loaded (if it parses), the domain is marked
 * running and a monitor event handle is registered. On any failure
 * before that point the monitor connection is closed again.
 */
static void
lxcReconnectVM(void *payload, const char *name ATTRIBUTE_UNUSED, void *opaque)
{
    virDomainObjPtr vm = payload;
    lxc_driver_t *driver = opaque;
    char *config = NULL;
    virDomainDefPtr tmp;
    lxcDomainObjPrivatePtr priv;

    virDomainObjLock(vm);

    priv = vm->privateData;
    if ((priv->monitor = lxcMonitorClient(driver, vm)) < 0) {
        goto cleanup;
    }

    /* Read pid from controller */
    if ((virFileReadPid(driver->stateDir, vm->def->name, &vm->pid)) != 0) {
        close(priv->monitor);
        priv->monitor = -1;
        goto cleanup;
    }

    if ((config = virDomainConfigFile(driver->stateDir,
                                      vm->def->name)) == NULL) {
        /* The domain is not going to be marked running, so do not
         * leave the monitor connection open behind it */
        close(priv->monitor);
        priv->monitor = -1;
        goto cleanup;
    }

    /* Try and load the live config */
    tmp = virDomainDefParseFile(driver->caps, config, 0);
    VIR_FREE(config);
    if (tmp) {
        /* Keep the previous definition as newDef and run with the live one */
        vm->newDef = vm->def;
        vm->def = tmp;
    }

    if (vm->pid != 0) {
        vm->def->id = vm->pid;
        vm->state = VIR_DOMAIN_RUNNING;

        if ((priv->monitorWatch = virEventAddHandle(
                 priv->monitor,
                 VIR_EVENT_HANDLE_ERROR | VIR_EVENT_HANDLE_HANGUP,
                 lxcMonitorEvent,
                 vm, NULL)) < 0) {
            lxcVmTerminate(driver, vm, 0);
            goto cleanup;
        }
    } else {
        vm->def->id = -1;
        close(priv->monitor);
        priv->monitor = -1;
    }

cleanup:
    virDomainObjUnlock(vm);
}

1691

1692
static int lxcStartup(int privileged)
D
Daniel Veillard 已提交
1693
{
1694
    char *ld;
1695
    int rc;
1696 1697 1698 1699 1700 1701

    /* Valgrind gets very annoyed when we clone containers, so
     * disable LXC when under valgrind
     * XXX remove this when valgrind is fixed
     */
    ld = getenv("LD_PRELOAD");
1702 1703 1704 1705
    if (ld && strstr(ld, "vgpreload")) {
        VIR_INFO0("Running under valgrind, disabling driver");
        return 0;
    }
1706

1707
    /* Check that the user is root, silently disable if not */
1708
    if (!privileged) {
1709 1710 1711 1712 1713 1714 1715 1716
        VIR_INFO0("Not running privileged, disabling driver");
        return 0;
    }

    /* Check that this is a container enabled kernel */
    if (lxcContainerAvailable(0) < 0) {
        VIR_INFO0("LXC support not available in this kernel, disabling driver");
        return 0;
1717 1718
    }

1719
    if (VIR_ALLOC(lxc_driver) < 0) {
1720 1721
        return -1;
    }
1722 1723 1724 1725
    if (virMutexInit(&lxc_driver->lock) < 0) {
        VIR_FREE(lxc_driver);
        return -1;
    }
1726
    lxcDriverLock(lxc_driver);
D
Daniel Veillard 已提交
1727

1728 1729 1730
    if (virDomainObjListInit(&lxc_driver->domains) < 0)
        goto cleanup;

1731
    if (VIR_ALLOC(lxc_driver->domainEventCallbacks) < 0)
1732 1733 1734 1735 1736 1737 1738 1739
        goto cleanup;
    if (!(lxc_driver->domainEventQueue = virDomainEventQueueNew()))
        goto cleanup;

    if ((lxc_driver->domainEventTimer =
         virEventAddTimeout(-1, lxcDomainEventFlush, lxc_driver, NULL)) < 0)
        goto cleanup;

A
Amy Griffis 已提交
1740
    lxc_driver->log_libvirtd = 0; /* by default log to container logfile */
1741
    lxc_driver->have_netns = lxcCheckNetNsSupport();
D
Daniel Veillard 已提交
1742

1743 1744 1745 1746 1747 1748 1749
    rc = virCgroupForDriver("lxc", &lxc_driver->cgroup, privileged, 1);
    if (rc < 0) {
        char buf[1024];
        VIR_WARN("Unable to create cgroup for driver: %s",
                 virStrerror(-rc, buf, sizeof(buf)));
    }

D
Daniel Veillard 已提交
1750
    /* Call function to load lxc driver configuration information */
1751 1752
    if (lxcLoadDriverConfig(lxc_driver) < 0)
        goto cleanup;
D
Daniel Veillard 已提交
1753

1754 1755
    if ((lxc_driver->caps = lxcCapsInit()) == NULL)
        goto cleanup;
D
Daniel Veillard 已提交
1756

1757 1758 1759
    lxc_driver->caps->privateDataAllocFunc = lxcDomainObjPrivateAlloc;
    lxc_driver->caps->privateDataFreeFunc = lxcDomainObjPrivateFree;

1760
    if (virDomainLoadAllConfigs(lxc_driver->caps,
1761 1762
                                &lxc_driver->domains,
                                lxc_driver->configDir,
1763
                                lxc_driver->autostartDir,
1764
                                0, NULL, NULL) < 0)
1765
        goto cleanup;
1766

1767
    virHashForEach(lxc_driver->domains.objs, lxcReconnectVM, lxc_driver);
1768

1769
    lxcDriverUnlock(lxc_driver);
D
Daniel Veillard 已提交
1770 1771
    return 0;

1772 1773 1774 1775
cleanup:
    lxcDriverUnlock(lxc_driver);
    lxcShutdown();
    return -1;
D
Daniel Veillard 已提交
1776 1777
}

1778 1779 1780 1781 1782 1783 1784 1785 1786 1787 1788 1789 1790 1791 1792 1793 1794 1795 1796 1797 1798 1799 1800 1801 1802 1803
/*
 * Config-load notification: queues a "defined/added" event for
 * domains reported as new (@newVM non-zero). @opaque is the driver.
 */
static void lxcNotifyLoadDomain(virDomainObjPtr vm, int newVM, void *opaque)
{
    lxc_driver_t *drv = opaque;
    virDomainEventPtr definedEvent;

    if (!newVM)
        return;

    definedEvent = virDomainEventNewFromObj(vm,
                                            VIR_DOMAIN_EVENT_DEFINED,
                                            VIR_DOMAIN_EVENT_DEFINED_ADDED);
    if (definedEvent != NULL)
        lxcDomainEventQueue(drv, definedEvent);
}

/**
 * lxcReload:
 *
 * Function to restart the LXC driver, it will recheck the configuration
 * files and perform autostart
 */
static int
lxcReload(void) {
    if (!lxc_driver)
        return 0;

    lxcDriverLock(lxc_driver);
1804
    virDomainLoadAllConfigs(lxc_driver->caps,
1805 1806 1807 1808 1809 1810 1811 1812 1813 1814 1815
                            &lxc_driver->domains,
                            lxc_driver->configDir,
                            lxc_driver->autostartDir,
                            0, lxcNotifyLoadDomain, lxc_driver);
    lxcDriverUnlock(lxc_driver);

    lxcAutostartConfigs(lxc_driver);

    return 0;
}

1816
static int lxcShutdown(void)
D
Daniel Veillard 已提交
1817
{
1818
    if (lxc_driver == NULL)
1819
        return(-1);
1820

1821
    lxcDriverLock(lxc_driver);
1822
    virDomainObjListDeinit(&lxc_driver->domains);
1823

1824 1825 1826 1827 1828 1829
    virDomainEventCallbackListFree(lxc_driver->domainEventCallbacks);
    virDomainEventQueueFree(lxc_driver->domainEventQueue);

    if (lxc_driver->domainEventTimer != -1)
        virEventRemoveTimeout(lxc_driver->domainEventTimer);

1830 1831 1832 1833 1834 1835
    virCapabilitiesFree(lxc_driver->caps);
    VIR_FREE(lxc_driver->configDir);
    VIR_FREE(lxc_driver->autostartDir);
    VIR_FREE(lxc_driver->stateDir);
    VIR_FREE(lxc_driver->logDir);
    lxcDriverUnlock(lxc_driver);
1836
    virMutexDestroy(&lxc_driver->lock);
1837
    VIR_FREE(lxc_driver);
1838 1839 1840

    return 0;
}
D
Daniel Veillard 已提交
1841

1842 1843 1844 1845 1846 1847 1848 1849 1850
/**
 * lxcActive:
 *
 * Checks if the LXC daemon is active, i.e. has an active domain
 *
 * Returns 1 if active, 0 otherwise
 */
static int
lxcActive(void) {
1851
    int active;
1852

1853 1854
    if (lxc_driver == NULL)
        return(0);
1855

1856
    lxcDriverLock(lxc_driver);
1857
    active = virDomainObjListNumOfDomains(&lxc_driver->domains, 1);
1858
    lxcDriverUnlock(lxc_driver);
1859

1860
    return active;
D
Daniel Veillard 已提交
1861 1862
}

1863
/*
 * lxcVersion:
 * @conn: unused
 * @version: filled with major * 1000000 + minor * 1000 + release,
 *           parsed from the kernel release string reported by uname()
 *
 * Returns 0 on success or -1 in case of error
 */
static int lxcVersion(virConnectPtr conn ATTRIBUTE_UNUSED, unsigned long *version)
{
    struct utsname ver;
    int maj;
    int min;
    int rev;

    /* On failure the contents of 'ver' are unspecified, so bail out
     * instead of parsing garbage */
    if (uname(&ver) < 0) {
        virReportSystemError(errno, "%s",
                             _("Unable to query kernel release"));
        return -1;
    }

    /* %d rather than %i: version components are decimal, and %i would
     * treat a leading 0 as an octal prefix */
    if (sscanf(ver.release, "%d.%d.%d", &maj, &min, &rev) != 3) {
        lxcError(VIR_ERR_INTERNAL_ERROR,
                 _("Unknown release: %s"), ver.release);
        return -1;
    }

    *version = (maj * 1000 * 1000) + (min * 1000) + rev;

    return 0;
}
1882

1883 1884
/*
 * lxcGetSchedulerType:
 * @domain: unused
 * @nparams: if non-NULL, set to 1
 *
 * Returns a newly allocated copy of the string "posix" which the
 * caller owns, or NULL (after reporting OOM) when allocation fails
 */
static char *lxcGetSchedulerType(virDomainPtr domain ATTRIBUTE_UNUSED,
                                 int *nparams)
{
    char *type;

    if (nparams != NULL)
        *nparams = 1;

    type = strdup("posix");
    if (!type)
        virReportOOMError();

    return type;
}

1899
static int lxcSetSchedulerParameters(virDomainPtr domain,
1900 1901 1902
                                     virSchedParameterPtr params,
                                     int nparams)
{
1903
    lxc_driver_t *driver = domain->conn->privateData;
1904
    int i;
1905 1906 1907
    virCgroupPtr group = NULL;
    virDomainObjPtr vm = NULL;
    int ret = -1;
1908

1909
    if (driver->cgroup == NULL)
1910 1911 1912 1913
        return -1;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);
1914

1915
    if (vm == NULL) {
1916
        lxcError(VIR_ERR_INTERNAL_ERROR,
1917 1918
                 _("No such domain %s"), domain->uuid);
        goto cleanup;
1919 1920
    }

1921
    if (virCgroupForDomain(driver->cgroup, vm->def->name, &group, 0) != 0)
1922
        goto cleanup;
1923 1924 1925

    for (i = 0; i < nparams; i++) {
        virSchedParameterPtr param = &params[i];
1926
        if (param->type != VIR_DOMAIN_SCHED_FIELD_ULLONG) {
1927
            lxcError(VIR_ERR_INVALID_ARG, "%s",
1928
                     _("Invalid type for cpu_shares tunable, expected a 'ullong'"));
1929 1930
            goto cleanup;
        }
1931 1932

        if (STREQ(param->field, "cpu_shares")) {
1933
            if (virCgroupSetCpuShares(group, params[i].value.ul) != 0)
1934
                goto cleanup;
1935
        } else {
1936
            lxcError(VIR_ERR_INVALID_ARG,
1937
                     _("Invalid parameter `%s'"), param->field);
1938
            goto cleanup;
1939 1940
        }
    }
1941
    ret = 0;
1942

1943
cleanup:
1944
    lxcDriverUnlock(driver);
1945
    virCgroupFree(&group);
1946 1947
    if (vm)
        virDomainObjUnlock(vm);
1948
    return ret;
1949 1950
}

1951
static int lxcGetSchedulerParameters(virDomainPtr domain,
1952 1953 1954
                                     virSchedParameterPtr params,
                                     int *nparams)
{
1955
    lxc_driver_t *driver = domain->conn->privateData;
1956 1957
    virCgroupPtr group = NULL;
    virDomainObjPtr vm = NULL;
1958
    unsigned long long val;
1959
    int ret = -1;
1960

1961
    if (driver->cgroup == NULL)
1962
        return -1;
1963 1964

    if ((*nparams) != 1) {
1965
        lxcError(VIR_ERR_INVALID_ARG,
J
Jim Meyering 已提交
1966
                 "%s", _("Invalid parameter count"));
1967
        return -1;
1968 1969
    }

1970 1971 1972
    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);

1973
    if (vm == NULL) {
1974
        lxcError(VIR_ERR_INTERNAL_ERROR,
1975 1976
                 _("No such domain %s"), domain->uuid);
        goto cleanup;
1977 1978
    }

1979
    if (virCgroupForDomain(driver->cgroup, vm->def->name, &group, 0) != 0)
1980
        goto cleanup;
1981

1982 1983
    if (virCgroupGetCpuShares(group, &val) != 0)
        goto cleanup;
1984
    params[0].value.ul = val;
C
Chris Lalancette 已提交
1985
    if (virStrcpyStatic(params[0].field, "cpu_shares") == NULL) {
1986
        lxcError(VIR_ERR_INTERNAL_ERROR,
C
Chris Lalancette 已提交
1987 1988 1989
                 "%s", _("Field cpu_shares too big for destination"));
        goto cleanup;
    }
1990 1991
    params[0].type = VIR_DOMAIN_SCHED_FIELD_ULLONG;

1992
    ret = 0;
1993

1994
cleanup:
1995
    lxcDriverUnlock(driver);
1996
    virCgroupFree(&group);
1997 1998
    if (vm)
        virDomainObjUnlock(vm);
1999
    return ret;
2000 2001
}

2002 2003 2004 2005 2006 2007 2008 2009 2010 2011 2012 2013 2014 2015 2016 2017 2018 2019
#ifdef __linux__
/**
 * lxcDomainInterfaceStats:
 * @dom: domain owning the interface
 * @path: interface name to query
 * @stats: filled in by linuxDomainInterfaceStats() on success
 *
 * Collects statistics for @path, provided the domain is active and
 * @path matches the ifname of one of the domain's network definitions.
 *
 * Returns the result of linuxDomainInterfaceStats() when the interface
 * is known, -1 otherwise.
 */
static int
lxcDomainInterfaceStats(virDomainPtr dom,
                        const char *path,
                        struct _virDomainInterfaceStats *stats)
{
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int found = 0;
    int ret = -1;
    int n;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    lxcDriverUnlock(driver);

    if (vm == NULL) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];

        virUUIDFormat(dom->uuid, uuidstr);
        lxcError(VIR_ERR_NO_DOMAIN,
                 _("No domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    if (!virDomainObjIsActive(vm)) {
        lxcError(VIR_ERR_OPERATION_INVALID,
                 "%s", _("Domain is not running"));
        goto cleanup;
    }

    /* Only interfaces that belong to this domain may be queried. */
    for (n = 0; n < vm->def->nnets && !found; n++) {
        if (vm->def->nets[n]->ifname == NULL)
            continue;
        if (STREQ(vm->def->nets[n]->ifname, path))
            found = 1;
    }

    if (!found) {
        lxcError(VIR_ERR_INVALID_ARG,
                 _("Invalid path, '%s' is not a known interface"), path);
        goto cleanup;
    }

    ret = linuxDomainInterfaceStats(path, stats);

cleanup:
    if (vm != NULL)
        virDomainObjUnlock(vm);
    return ret;
}
#else
/*
 * Stub used when not building for Linux: interface statistics are not
 * available, so report VIR_ERR_NO_SUPPORT and fail.
 */
static int
lxcDomainInterfaceStats(virDomainPtr dom ATTRIBUTE_UNUSED,
                        const char *path ATTRIBUTE_UNUSED,
                        struct _virDomainInterfaceStats *stats ATTRIBUTE_UNUSED)
{
    lxcError(VIR_ERR_NO_SUPPORT, "%s", __FUNCTION__);
    return -1;
}
#endif

2061 2062 2063 2064 2065 2066 2067 2068 2069 2070 2071 2072 2073
/**
 * lxcDomainGetAutostart:
 * @dom: domain to query
 * @autostart: receives the autostart flag stored on the domain object
 *
 * Returns 0 on success, -1 if no domain matches the UUID of @dom.
 */
static int lxcDomainGetAutostart(virDomainPtr dom,
                                 int *autostart)
{
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    lxcDriverUnlock(driver);

    if (vm == NULL) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];

        virUUIDFormat(dom->uuid, uuidstr);
        lxcError(VIR_ERR_NO_DOMAIN,
                 _("No domain with matching uuid '%s'"), uuidstr);
        return -1;
    }

    *autostart = vm->autostart;

    virDomainObjUnlock(vm);
    return 0;
}

/**
 * lxcDomainSetAutostart:
 * @dom: domain to update
 * @autostart: non-zero to enable autostart, zero to disable it
 *
 * Enabling creates a symlink to the domain's config file under
 * driver->autostartDir (creating that directory first); disabling
 * removes the symlink, tolerating one that is already absent.
 * Transient domains are rejected. Nothing is done when the domain is
 * already in the requested state.
 *
 * Returns 0 on success, -1 on failure.
 */
static int lxcDomainSetAutostart(virDomainPtr dom,
                                   int autostart) {
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    char *configFile = NULL, *autostartLink = NULL;
    int ret = -1;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        lxcError(VIR_ERR_NO_DOMAIN,
                 _("No domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    if (!vm->persistent) {
        lxcError(VIR_ERR_INTERNAL_ERROR,
                 "%s", _("Cannot set autostart for transient domain"));
        goto cleanup;
    }

    /* Normalise to 0/1 so it can be compared with the stored flag */
    autostart = (autostart != 0);

    if (vm->autostart == autostart) {
        ret = 0;
        goto cleanup;
    }

    configFile = virDomainConfigFile(driver->configDir,
                                     vm->def->name);
    if (configFile == NULL)
        goto cleanup;
    autostartLink = virDomainConfigFile(driver->autostartDir,
                                        vm->def->name);
    if (autostartLink == NULL)
        goto cleanup;

    if (autostart) {
        int err;

        if ((err = virFileMakePath(driver->autostartDir))) {
            virReportSystemError(err,
                                 _("Cannot create autostart directory %s"),
                                 driver->autostartDir);
            goto cleanup;
        }

        if (symlink(configFile, autostartLink) < 0) {
            virReportSystemError(errno,
                                 _("Failed to create symlink '%s' to '%s'"),
                                 autostartLink, configFile);
            goto cleanup;
        }
    } else {
        /* A link that does not exist is not an error when disabling */
        if (unlink(autostartLink) < 0 && errno != ENOENT && errno != ENOTDIR) {
            virReportSystemError(errno,
                                 _("Failed to delete symlink '%s'"),
                                 autostartLink);
            goto cleanup;
        }
    }

    vm->autostart = autostart;
    ret = 0;

cleanup:
    VIR_FREE(configFile);
    VIR_FREE(autostartLink);
    if (vm)
        virDomainObjUnlock(vm);
    lxcDriverUnlock(driver);
    return ret;
}

R
Ryota Ozaki 已提交
2165 2166 2167 2168 2169 2170 2171 2172 2173 2174 2175 2176 2177 2178 2179 2180 2181 2182 2183 2184 2185 2186 2187 2188 2189 2190 2191 2192 2193 2194 2195 2196 2197 2198 2199 2200 2201 2202 2203 2204 2205 2206 2207 2208 2209 2210 2211 2212 2213 2214 2215 2216 2217 2218 2219 2220 2221 2222 2223 2224 2225 2226 2227 2228 2229 2230 2231 2232 2233 2234 2235 2236 2237 2238 2239 2240 2241 2242 2243 2244 2245 2246 2247 2248 2249 2250 2251 2252 2253 2254 2255 2256 2257 2258 2259 2260 2261 2262 2263 2264 2265 2266 2267 2268 2269
/**
 * lxcFreezeContainer:
 * @driver: LXC driver state; its cgroup must be set
 * @vm: domain whose cgroup is to be frozen
 *
 * Requests the "FROZEN" freezer state for the domain's cgroup and polls
 * until the state read back is "FROZEN". The polling interval starts at
 * 1ms and is multiplied by 10 after every unsuccessful check; polling
 * stops once the accumulated wait reaches 1000ms. On timeout or error
 * the group is set back to "THAWED".
 *
 * Returns 0 once the group reports "FROZEN", -1 otherwise.
 */
static int lxcFreezeContainer(lxc_driver_t *driver, virDomainObjPtr vm)
{
    int max_wait_ms = 1000;
    int interval_ms = 1;
    int backoff = 10;
    int elapsed_ms = 0;
    int ret = -1;
    char *state = NULL;
    virCgroupPtr cgroup = NULL;

    if (driver->cgroup == NULL ||
        virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) != 0)
        return -1;

    while (elapsed_ms < max_wait_ms) {
        /*
         * Writing "FROZEN" to freezer.state starts freezing the group.
         * The group passes through "FREEZING" and reaches "FROZEN"
         * when freezing has completed
         * (see linux-2.6/Documentation/cgroups/freezer-subsystem.txt).
         */
        int rc = virCgroupSetFreezerState(cgroup, "FROZEN");

        /*
         * -EBUSY means freezing is in progress but not yet complete;
         * any other negative value is a real failure.
         */
        if (rc == -EBUSY) {
            VIR_DEBUG0("Writing freezer.state gets EBUSY");
        } else if (rc < 0) {
            VIR_DEBUG("Writing freezer.state failed with errno: %d", rc);
            goto error;
        }

        /*
         * A successful write does not guarantee the freeze finished:
         * the group may still be "FREEZING", and may even stay there
         * after further writes. The return value is therefore not
         * trusted; only a state read back as "FROZEN" counts.
         */
        usleep(interval_ms * 1000);

        rc = virCgroupGetFreezerState(cgroup, &state);
        if (rc < 0) {
            VIR_DEBUG("Reading freezer.state failed with errno: %d", rc);
            goto error;
        }
        VIR_DEBUG("Read freezer.state: %s", state);

        if (STREQ(state, "FROZEN")) {
            ret = 0;
            goto cleanup;
        }

        VIR_FREE(state);

        /*
         * Exponential back-off: an idle container freezes quickly, so
         * short initial waits suffice; a heavily loaded one may linger
         * in "FREEZING", where frequent polling only wastes CPU time.
         */
        elapsed_ms += interval_ms;
        interval_ms *= backoff;
    }
    VIR_DEBUG0("lxcFreezeContainer timeout");

error:
    /*
     * Timed out or failed: thaw the group again so the container is
     * not left partially frozen, then report the failure.
     */
    virCgroupSetFreezerState(cgroup, "THAWED");
    ret = -1;

cleanup:
    if (cgroup != NULL)
        virCgroupFree(&cgroup);
    VIR_FREE(state);
    return ret;
}

/**
 * lxcDomainSuspend:
 * @dom: domain to suspend
 *
 * Freezes the container of an active domain unless it is already in
 * VIR_DOMAIN_PAUSED state, marks it paused, creates a "suspended"
 * event and saves the domain status. An event that was created is
 * queued even if saving the status fails.
 *
 * Returns 0 on success, -1 on failure.
 */
static int lxcDomainSuspend(virDomainPtr dom)
{
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainEventPtr event = NULL;
    virDomainObjPtr vm;
    int ret = -1;

    lxcDriverLock(driver);

    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    if (vm == NULL) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];

        virUUIDFormat(dom->uuid, uuidstr);
        lxcError(VIR_ERR_NO_DOMAIN,
                 _("No domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    if (!virDomainObjIsActive(vm)) {
        lxcError(VIR_ERR_OPERATION_INVALID,
                 "%s", _("Domain is not running"));
        goto cleanup;
    }

    /* Freeze only when the domain is not paused already. */
    if (vm->state != VIR_DOMAIN_PAUSED) {
        if (lxcFreezeContainer(driver, vm) < 0) {
            lxcError(VIR_ERR_OPERATION_FAILED,
                     "%s", _("Suspend operation failed"));
            goto cleanup;
        }

        vm->state = VIR_DOMAIN_PAUSED;
        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_SUSPENDED,
                                         VIR_DOMAIN_EVENT_SUSPENDED_PAUSED);
    }

    if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) >= 0)
        ret = 0;

cleanup:
    if (event != NULL)
        lxcDomainEventQueue(driver, event);
    if (vm != NULL)
        virDomainObjUnlock(vm);
    lxcDriverUnlock(driver);
    return ret;
}

/**
 * lxcUnfreezeContainer:
 * @driver: LXC driver state; its cgroup must be set
 * @vm: domain whose cgroup is to be thawed
 *
 * Sets the freezer state of the domain's cgroup to "THAWED".
 *
 * Returns the result of virCgroupSetFreezerState(), or -1 if the
 * domain's cgroup could not be obtained.
 */
static int lxcUnfreezeContainer(lxc_driver_t *driver, virDomainObjPtr vm)
{
    virCgroupPtr cgroup = NULL;
    int rc;

    if (driver->cgroup == NULL)
        return -1;

    if (virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) != 0)
        return -1;

    rc = virCgroupSetFreezerState(cgroup, "THAWED");
    virCgroupFree(&cgroup);

    return rc;
}

/**
 * lxcDomainResume:
 * @dom: domain to resume
 *
 * Thaws the container of an active domain that is in
 * VIR_DOMAIN_PAUSED state, marks it running, creates a "resumed"
 * event and saves the domain status. An event that was created is
 * queued even if saving the status fails.
 *
 * Returns 0 on success, -1 on failure.
 */
static int lxcDomainResume(virDomainPtr dom)
{
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainEventPtr event = NULL;
    virDomainObjPtr vm;
    int ret = -1;

    lxcDriverLock(driver);

    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    if (vm == NULL) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];

        virUUIDFormat(dom->uuid, uuidstr);
        lxcError(VIR_ERR_NO_DOMAIN,
                 _("No domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    if (!virDomainObjIsActive(vm)) {
        lxcError(VIR_ERR_OPERATION_INVALID,
                 "%s", _("Domain is not running"));
        goto cleanup;
    }

    /* Thaw only when the domain is actually paused. */
    if (vm->state == VIR_DOMAIN_PAUSED) {
        if (lxcUnfreezeContainer(driver, vm) < 0) {
            lxcError(VIR_ERR_OPERATION_FAILED,
                     "%s", _("Resume operation failed"));
            goto cleanup;
        }

        vm->state = VIR_DOMAIN_RUNNING;
        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_RESUMED,
                                         VIR_DOMAIN_EVENT_RESUMED_UNPAUSED);
    }

    if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) >= 0)
        ret = 0;

cleanup:
    if (event != NULL)
        lxcDomainEventQueue(driver, event);
    if (vm != NULL)
        virDomainObjUnlock(vm);
    lxcDriverUnlock(driver);
    return ret;
}


D
Daniel Veillard 已提交
2373 2374 2375 2376 2377 2378 2379 2380
/* Function Tables */
/*
 * Hypervisor driver table for LXC. The initializer is positional: each
 * entry fills the next virDriver slot in declaration order, and NULL
 * marks an operation this driver does not provide. Entries must not be
 * reordered.
 */
static virDriver lxcDriver = {
    VIR_DRV_LXC, /* the number virDrvNo */
    "LXC", /* the name of the driver */
    lxcOpen, /* open */
    lxcClose, /* close */
    NULL, /* supports_feature */
    NULL, /* type */
    lxcVersion, /* version */
    NULL, /* libvirtVersion (impl. in libvirt.c) */
    virGetHostname, /* getHostname */
    NULL, /* getMaxVcpus */
    nodeGetInfo, /* nodeGetInfo */
    lxcGetCapabilities, /* getCapabilities */
    lxcListDomains, /* listDomains */
    lxcNumDomains, /* numOfDomains */
    lxcDomainCreateAndStart, /* domainCreateXML */
    lxcDomainLookupByID, /* domainLookupByID */
    lxcDomainLookupByUUID, /* domainLookupByUUID */
    lxcDomainLookupByName, /* domainLookupByName */
    lxcDomainSuspend, /* domainSuspend */
    lxcDomainResume, /* domainResume */
    lxcDomainShutdown, /* domainShutdown */
    NULL, /* domainReboot */
    lxcDomainDestroy, /* domainDestroy */
    lxcGetOSType, /* domainGetOSType */
    lxcDomainGetMaxMemory, /* domainGetMaxMemory */
    lxcDomainSetMaxMemory, /* domainSetMaxMemory */
    lxcDomainSetMemory, /* domainSetMemory */
    lxcDomainGetInfo, /* domainGetInfo */
    NULL, /* domainSave */
    NULL, /* domainRestore */
    NULL, /* domainCoreDump */
    NULL, /* domainSetVcpus */
    NULL, /* domainPinVcpu */
    NULL, /* domainGetVcpus */
    NULL, /* domainGetMaxVcpus */
    NULL, /* domainGetSecurityLabel */
    NULL, /* nodeGetSecurityModel */
    lxcDomainDumpXML, /* domainDumpXML */
    NULL, /* domainXMLFromNative */
    NULL, /* domainXMLToNative */
    lxcListDefinedDomains, /* listDefinedDomains */
    lxcNumDefinedDomains, /* numOfDefinedDomains */
    lxcDomainStart, /* domainCreate */
    lxcDomainDefine, /* domainDefineXML */
    lxcDomainUndefine, /* domainUndefine */
    NULL, /* domainAttachDevice */
    NULL, /* domainAttachDeviceFlags */
    NULL, /* domainDetachDevice */
    NULL, /* domainDetachDeviceFlags */
    lxcDomainGetAutostart, /* domainGetAutostart */
    lxcDomainSetAutostart, /* domainSetAutostart */
    lxcGetSchedulerType, /* domainGetSchedulerType */
    lxcGetSchedulerParameters, /* domainGetSchedulerParameters */
    lxcSetSchedulerParameters, /* domainSetSchedulerParameters */
    NULL, /* domainMigratePrepare */
    NULL, /* domainMigratePerform */
    NULL, /* domainMigrateFinish */
    NULL, /* domainBlockStats */
    lxcDomainInterfaceStats, /* domainInterfaceStats */
    NULL, /* domainMemoryStats */
    NULL, /* domainBlockPeek */
    NULL, /* domainMemoryPeek */
    nodeGetCellsFreeMemory, /* nodeGetCellsFreeMemory */
    nodeGetFreeMemory,  /* getFreeMemory */
    lxcDomainEventRegister, /* domainEventRegister */
    lxcDomainEventDeregister, /* domainEventDeregister */
    NULL, /* domainMigratePrepare2 */
    NULL, /* domainMigrateFinish2 */
    NULL, /* nodeDeviceDettach */
    NULL, /* nodeDeviceReAttach */
    NULL, /* nodeDeviceReset */
    NULL, /* domainMigratePrepareTunnel */
    /* NOTE(review): slot names for the next four entries are presumed
     * from the handler names; confirm against the virDriver declaration */
    lxcIsEncrypted, /* isEncrypted */
    lxcIsSecure, /* isSecure */
    lxcDomainIsActive, /* domainIsActive */
    lxcDomainIsPersistent, /* domainIsPersistent */
    NULL, /* cpuCompare */
};

2454
static virStateDriver lxcStateDriver = {
2455
    .name = "LXC",
2456 2457 2458
    .initialize = lxcStartup,
    .cleanup = lxcShutdown,
    .active = lxcActive,
2459
    .reload = lxcReload,
2460 2461
};

D
Daniel Veillard 已提交
2462 2463 2464
int lxcRegister(void)
{
    virRegisterDriver(&lxcDriver);
2465
    virRegisterStateDriver(&lxcStateDriver);
D
Daniel Veillard 已提交
2466 2467
    return 0;
}