lxc_driver.c 67.5 KB
Newer Older
D
Daniel Veillard 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25
/*
 * Copyright IBM Corp. 2008
 *
 * lxc_driver.c: linux container driver functions
 *
 * Authors:
 *  David L. Leskovec <dlesko at linux.vnet.ibm.com>
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
 */

#include <config.h>

26
#include <fcntl.h>
D
Daniel Veillard 已提交
27 28
#include <sched.h>
#include <sys/utsname.h>
D
David L. Leskovec 已提交
29
#include <stdbool.h>
D
Daniel Veillard 已提交
30 31
#include <string.h>
#include <sys/types.h>
32 33 34
#include <sys/socket.h>
#include <sys/un.h>
#include <sys/poll.h>
D
Daniel Veillard 已提交
35 36 37
#include <unistd.h>
#include <wait.h>

38
#include "virterror_internal.h"
39
#include "logging.h"
40
#include "datatypes.h"
D
Daniel Veillard 已提交
41
#include "lxc_conf.h"
42
#include "lxc_container.h"
D
Daniel Veillard 已提交
43
#include "lxc_driver.h"
44
#include "memory.h"
45
#include "util.h"
46 47
#include "bridge.h"
#include "veth.h"
48
#include "event.h"
49
#include "nodeinfo.h"
50
#include "uuid.h"
51
#include "stats_linux.h"
52

D
Daniel Veillard 已提交
53

54 55
#define VIR_FROM_THIS VIR_FROM_LXC

56 57 58 59 60 61 62 63
typedef struct _lxcDomainObjPrivate lxcDomainObjPrivate;
typedef lxcDomainObjPrivate *lxcDomainObjPrivatePtr;
struct _lxcDomainObjPrivate {
    int monitor;
    int monitorWatch;
};


64
static int lxcStartup(int privileged);
65
static int lxcShutdown(void);
66
static lxc_driver_t *lxc_driver = NULL;
D
Daniel Veillard 已提交
67 68 69

/* Functions */

70 71
static void lxcDriverLock(lxc_driver_t *driver)
{
72
    virMutexLock(&driver->lock);
73 74 75
}
static void lxcDriverUnlock(lxc_driver_t *driver)
{
76
    virMutexUnlock(&driver->lock);
77 78
}

79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99
static void *lxcDomainObjPrivateAlloc(void)
{
    lxcDomainObjPrivatePtr priv;

    if (VIR_ALLOC(priv) < 0)
        return NULL;

    priv->monitor = -1;
    priv->monitorWatch = -1;

    return priv;
}

static void lxcDomainObjPrivateFree(void *data)
{
    lxcDomainObjPrivatePtr priv = data;

    VIR_FREE(priv);
}


100 101 102 103
static void lxcDomainEventFlush(int timer, void *opaque);
static void lxcDomainEventQueue(lxc_driver_t *driver,
                                virDomainEventPtr event);

104

D
Daniel Veillard 已提交
105 106 107 108 109
static virDrvOpenStatus lxcOpen(virConnectPtr conn,
                                virConnectAuthPtr auth ATTRIBUTE_UNUSED,
                                int flags ATTRIBUTE_UNUSED)
{
    /* Verify uri was specified */
110
    if (conn->uri == NULL) {
111 112
        if (lxc_driver == NULL)
            return VIR_DRV_OPEN_DECLINED;
113

114 115
        conn->uri = xmlParseURI("lxc:///");
        if (!conn->uri) {
116
            virReportOOMError();
117 118
            return VIR_DRV_OPEN_ERROR;
        }
119 120 121 122 123 124 125 126 127 128
    } else {
        if (conn->uri->scheme == NULL ||
            STRNEQ(conn->uri->scheme, "lxc"))
            return VIR_DRV_OPEN_DECLINED;

        /* Leave for remote driver */
        if (conn->uri->server != NULL)
            return VIR_DRV_OPEN_DECLINED;

        /* If path isn't '/' then they typoed, tell them correct path */
129 130
        if (conn->uri->path != NULL &&
            STRNEQ(conn->uri->path, "/")) {
131
            lxcError(VIR_ERR_INTERNAL_ERROR,
132
                     _("Unexpected LXC URI path '%s', try lxc:///"),
133 134 135
                     conn->uri->path);
            return VIR_DRV_OPEN_ERROR;
        }
D
Daniel Veillard 已提交
136

137 138
        /* URI was good, but driver isn't active */
        if (lxc_driver == NULL) {
139
            lxcError(VIR_ERR_INTERNAL_ERROR,
140
                     "%s", _("lxc state driver is not active"));
141 142 143
            return VIR_DRV_OPEN_ERROR;
        }
    }
144

145
    conn->privateData = lxc_driver;
D
Daniel Veillard 已提交
146 147 148 149 150 151

    return VIR_DRV_OPEN_SUCCESS;
}

static int lxcClose(virConnectPtr conn)
{
152 153 154 155 156 157
    lxc_driver_t *driver = conn->privateData;

    lxcDriverLock(driver);
    virDomainEventCallbackListRemoveConn(conn, driver->domainEventCallbacks);
    lxcDriverUnlock(driver);

158 159
    conn->privateData = NULL;
    return 0;
D
Daniel Veillard 已提交
160 161
}

162 163 164 165 166 167 168 169 170 171 172 173 174 175 176

static int lxcIsSecure(virConnectPtr conn ATTRIBUTE_UNUSED)
{
    /* Trivially secure, since always inside the daemon */
    return 1;
}


static int lxcIsEncrypted(virConnectPtr conn ATTRIBUTE_UNUSED)
{
    /* Not encrypted, but remote driver takes care of that */
    return 0;
}


177 178 179 180 181 182
static char *lxcGetCapabilities(virConnectPtr conn) {
    lxc_driver_t *driver = conn->privateData;
    char *xml;

    lxcDriverLock(driver);
    if ((xml = virCapabilitiesFormatXML(driver->caps)) == NULL)
183
        virReportOOMError();
184 185 186 187 188 189
    lxcDriverUnlock(driver);

    return xml;
}


D
Daniel Veillard 已提交
190 191 192
static virDomainPtr lxcDomainLookupByID(virConnectPtr conn,
                                        int id)
{
193 194 195
    lxc_driver_t *driver = conn->privateData;
    virDomainObjPtr vm;
    virDomainPtr dom = NULL;
D
Daniel Veillard 已提交
196

197
    lxcDriverLock(driver);
198
    vm = virDomainFindByID(&driver->domains, id);
199 200
    lxcDriverUnlock(driver);

D
Daniel Veillard 已提交
201
    if (!vm) {
202
        lxcError(VIR_ERR_NO_DOMAIN, NULL);
203
        goto cleanup;
D
Daniel Veillard 已提交
204 205 206
    }

    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
207
    if (dom)
D
Daniel Veillard 已提交
208 209
        dom->id = vm->def->id;

210
cleanup:
211 212
    if (vm)
        virDomainObjUnlock(vm);
D
Daniel Veillard 已提交
213 214 215 216 217 218
    return dom;
}

static virDomainPtr lxcDomainLookupByUUID(virConnectPtr conn,
                                          const unsigned char *uuid)
{
219 220 221
    lxc_driver_t *driver = conn->privateData;
    virDomainObjPtr vm;
    virDomainPtr dom = NULL;
D
Daniel Veillard 已提交
222

223
    lxcDriverLock(driver);
224
    vm = virDomainFindByUUID(&driver->domains, uuid);
225 226
    lxcDriverUnlock(driver);

D
Daniel Veillard 已提交
227
    if (!vm) {
228
        lxcError(VIR_ERR_NO_DOMAIN, NULL);
229
        goto cleanup;
D
Daniel Veillard 已提交
230 231 232
    }

    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
233
    if (dom)
D
Daniel Veillard 已提交
234 235
        dom->id = vm->def->id;

236
cleanup:
237 238
    if (vm)
        virDomainObjUnlock(vm);
D
Daniel Veillard 已提交
239 240 241 242 243 244
    return dom;
}

static virDomainPtr lxcDomainLookupByName(virConnectPtr conn,
                                          const char *name)
{
245 246 247
    lxc_driver_t *driver = conn->privateData;
    virDomainObjPtr vm;
    virDomainPtr dom = NULL;
D
Daniel Veillard 已提交
248

249
    lxcDriverLock(driver);
250
    vm = virDomainFindByName(&driver->domains, name);
251
    lxcDriverUnlock(driver);
D
Daniel Veillard 已提交
252
    if (!vm) {
253
        lxcError(VIR_ERR_NO_DOMAIN, NULL);
254
        goto cleanup;
D
Daniel Veillard 已提交
255 256 257
    }

    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
258
    if (dom)
D
Daniel Veillard 已提交
259 260
        dom->id = vm->def->id;

261
cleanup:
262 263
    if (vm)
        virDomainObjUnlock(vm);
D
Daniel Veillard 已提交
264 265 266
    return dom;
}

267 268 269 270 271 272 273 274 275 276 277

static int lxcDomainIsActive(virDomainPtr dom)
{
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr obj;
    int ret = -1;

    lxcDriverLock(driver);
    obj = virDomainFindByUUID(&driver->domains, dom->uuid);
    lxcDriverUnlock(driver);
    if (!obj) {
278
        lxcError(VIR_ERR_NO_DOMAIN, NULL);
279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299
        goto cleanup;
    }
    ret = virDomainObjIsActive(obj);

cleanup:
    if (obj)
        virDomainObjUnlock(obj);
    return ret;
}


static int lxcDomainIsPersistent(virDomainPtr dom)
{
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr obj;
    int ret = -1;

    lxcDriverLock(driver);
    obj = virDomainFindByUUID(&driver->domains, dom->uuid);
    lxcDriverUnlock(driver);
    if (!obj) {
300
        lxcError(VIR_ERR_NO_DOMAIN, NULL);
301 302 303 304 305 306 307 308 309 310 311
        goto cleanup;
    }
    ret = obj->persistent;

cleanup:
    if (obj)
        virDomainObjUnlock(obj);
    return ret;
}


312
static int lxcListDomains(virConnectPtr conn, int *ids, int nids) {
313
    lxc_driver_t *driver = conn->privateData;
314
    int n;
315

316
    lxcDriverLock(driver);
317
    n = virDomainObjListGetActiveIDs(&driver->domains, ids, nids);
318
    lxcDriverUnlock(driver);
319

320
    return n;
D
Daniel Veillard 已提交
321
}
322

323
static int lxcNumDomains(virConnectPtr conn) {
324
    lxc_driver_t *driver = conn->privateData;
325
    int n;
326

327
    lxcDriverLock(driver);
328
    n = virDomainObjListNumOfDomains(&driver->domains, 1);
329
    lxcDriverUnlock(driver);
330

331
    return n;
D
Daniel Veillard 已提交
332 333 334
}

static int lxcListDefinedDomains(virConnectPtr conn,
335
                                 char **const names, int nnames) {
336
    lxc_driver_t *driver = conn->privateData;
337
    int n;
338

339
    lxcDriverLock(driver);
340
    n = virDomainObjListGetInactiveNames(&driver->domains, names, nnames);
341
    lxcDriverUnlock(driver);
342

343
    return n;
D
Daniel Veillard 已提交
344 345 346
}


347
static int lxcNumDefinedDomains(virConnectPtr conn) {
348
    lxc_driver_t *driver = conn->privateData;
349
    int n;
350

351
    lxcDriverLock(driver);
352
    n = virDomainObjListNumOfDomains(&driver->domains, 0);
353
    lxcDriverUnlock(driver);
354

355
    return n;
D
Daniel Veillard 已提交
356 357
}

358 359


D
Daniel Veillard 已提交
360 361
static virDomainPtr lxcDomainDefine(virConnectPtr conn, const char *xml)
{
362 363
    lxc_driver_t *driver = conn->privateData;
    virDomainDefPtr def = NULL;
364
    virDomainObjPtr vm = NULL;
365
    virDomainPtr dom = NULL;
366
    virDomainEventPtr event = NULL;
367
    int dupVM;
D
Daniel Veillard 已提交
368

369
    lxcDriverLock(driver);
370
    if (!(def = virDomainDefParseString(driver->caps, xml,
371
                                        VIR_DOMAIN_XML_INACTIVE)))
372
        goto cleanup;
D
Daniel Veillard 已提交
373

374 375
   if ((dupVM = virDomainObjIsDuplicate(&driver->domains, def, 0)) < 0)
        goto cleanup;
376

377
    if ((def->nets != NULL) && !(driver->have_netns)) {
378
        lxcError(VIR_ERR_NO_SUPPORT,
J
Jim Meyering 已提交
379
                 "%s", _("System lacks NETNS support"));
380
        goto cleanup;
381 382
    }

383
    if (!(vm = virDomainAssignDef(driver->caps,
384
                                  &driver->domains, def)))
385 386
        goto cleanup;
    def = NULL;
387
    vm->persistent = 1;
D
Daniel Veillard 已提交
388

389
    if (virDomainSaveConfig(driver->configDir,
390
                            vm->newDef ? vm->newDef : vm->def) < 0) {
391
        virDomainRemoveInactive(&driver->domains, vm);
392
        vm = NULL;
393
        goto cleanup;
D
Daniel Veillard 已提交
394 395
    }

396 397
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_DEFINED,
398
                                     !dupVM ?
399 400 401
                                     VIR_DOMAIN_EVENT_DEFINED_ADDED :
                                     VIR_DOMAIN_EVENT_DEFINED_UPDATED);

D
Daniel Veillard 已提交
402
    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
403
    if (dom)
D
Daniel Veillard 已提交
404 405
        dom->id = vm->def->id;

406 407
cleanup:
    virDomainDefFree(def);
408 409
    if (vm)
        virDomainObjUnlock(vm);
410 411
    if (event)
        lxcDomainEventQueue(driver, event);
412
    lxcDriverUnlock(driver);
D
Daniel Veillard 已提交
413 414 415 416 417
    return dom;
}

static int lxcDomainUndefine(virDomainPtr dom)
{
418 419
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
420
    virDomainEventPtr event = NULL;
421
    int ret = -1;
D
Daniel Veillard 已提交
422

423
    lxcDriverLock(driver);
424
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
D
Daniel Veillard 已提交
425
    if (!vm) {
426
        lxcError(VIR_ERR_INVALID_DOMAIN,
427
                 "%s", _("No domain with matching uuid"));
428
        goto cleanup;
D
Daniel Veillard 已提交
429 430
    }

D
Daniel P. Berrange 已提交
431
    if (virDomainObjIsActive(vm)) {
432
        lxcError(VIR_ERR_OPERATION_INVALID,
433
                 "%s", _("Cannot delete active domain"));
434
        goto cleanup;
D
Daniel Veillard 已提交
435 436
    }

437
    if (!vm->persistent) {
438
        lxcError(VIR_ERR_OPERATION_INVALID,
439
                 "%s", _("Cannot undefine transient domain"));
440
        goto cleanup;
441
    }
D
Daniel Veillard 已提交
442

443
    if (virDomainDeleteConfig(driver->configDir,
444
                              driver->autostartDir,
445 446
                              vm) < 0)
        goto cleanup;
D
Daniel Veillard 已提交
447

448 449 450 451
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_UNDEFINED,
                                     VIR_DOMAIN_EVENT_UNDEFINED_REMOVED);

452
    virDomainRemoveInactive(&driver->domains, vm);
453
    vm = NULL;
454
    ret = 0;
D
Daniel Veillard 已提交
455

456
cleanup:
457 458
    if (vm)
        virDomainObjUnlock(vm);
459 460
    if (event)
        lxcDomainEventQueue(driver, event);
461
    lxcDriverUnlock(driver);
462
    return ret;
D
Daniel Veillard 已提交
463 464 465 466 467
}

static int lxcDomainGetInfo(virDomainPtr dom,
                            virDomainInfoPtr info)
{
468 469
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
470
    virCgroupPtr cgroup = NULL;
471
    int ret = -1;
D
Daniel Veillard 已提交
472

473
    lxcDriverLock(driver);
474
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
475

D
Daniel Veillard 已提交
476
    if (!vm) {
477
        lxcError(VIR_ERR_INVALID_DOMAIN,
478
                 "%s", _("No domain with matching uuid"));
479
        goto cleanup;
D
Daniel Veillard 已提交
480 481 482 483
    }

    info->state = vm->state;

D
Daniel P. Berrange 已提交
484
    if (!virDomainObjIsActive(vm) || driver->cgroup == NULL) {
D
Daniel Veillard 已提交
485
        info->cpuTime = 0;
R
Ryota Ozaki 已提交
486
        info->memory = vm->def->memory;
D
Daniel Veillard 已提交
487
    } else {
488
        if (virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) != 0) {
489
            lxcError(VIR_ERR_INTERNAL_ERROR,
490
                     _("Unable to get cgroup for %s"), vm->def->name);
491 492 493 494
            goto cleanup;
        }

        if (virCgroupGetCpuacctUsage(cgroup, &(info->cpuTime)) < 0) {
495
            lxcError(VIR_ERR_OPERATION_FAILED,
496
                     "%s", _("Cannot read cputime for domain"));
R
Ryota Ozaki 已提交
497 498 499
            goto cleanup;
        }
        if (virCgroupGetMemoryUsage(cgroup, &(info->memory)) < 0) {
500
            lxcError(VIR_ERR_OPERATION_FAILED,
501
                     "%s", _("Cannot read memory usage for domain"));
502 503
            goto cleanup;
        }
D
Daniel Veillard 已提交
504 505
    }

506
    info->maxMem = vm->def->maxmem;
D
Daniel Veillard 已提交
507
    info->nrVirtCpu = 1;
508
    ret = 0;
D
Daniel Veillard 已提交
509

510
cleanup:
511
    lxcDriverUnlock(driver);
512 513
    if (cgroup)
        virCgroupFree(&cgroup);
514 515
    if (vm)
        virDomainObjUnlock(vm);
516
    return ret;
D
Daniel Veillard 已提交
517 518
}

519
static char *lxcGetOSType(virDomainPtr dom)
D
Daniel Veillard 已提交
520
{
521 522 523
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    char *ret = NULL;
524

525
    lxcDriverLock(driver);
526
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
527 528
    lxcDriverUnlock(driver);

529
    if (!vm) {
530
        lxcError(VIR_ERR_INVALID_DOMAIN,
531
                 "%s", _("No domain with matching uuid"));
532
        goto cleanup;
533 534
    }

535 536
    ret = strdup(vm->def->os.type);

537
    if (ret == NULL)
538
        virReportOOMError();
539

540
cleanup:
541 542
    if (vm)
        virDomainObjUnlock(vm);
543
    return ret;
D
Daniel Veillard 已提交
544 545
}

R
Ryota Ozaki 已提交
546 547 548 549 550 551 552 553 554 555 556 557 558
/* Returns max memory in kb, 0 if error */
static unsigned long lxcDomainGetMaxMemory(virDomainPtr dom) {
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    unsigned long ret = 0;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    lxcDriverUnlock(driver);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
559
        lxcError(VIR_ERR_NO_DOMAIN,
560
                         _("No domain with matching uuid '%s'"), uuidstr);
R
Ryota Ozaki 已提交
561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583
        goto cleanup;
    }

    ret = vm->def->maxmem;

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    return ret;
}

static int lxcDomainSetMaxMemory(virDomainPtr dom, unsigned long newmax) {
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    lxcDriverUnlock(driver);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
584
        lxcError(VIR_ERR_NO_DOMAIN,
585
                         _("No domain with matching uuid '%s'"), uuidstr);
R
Ryota Ozaki 已提交
586 587 588 589
        goto cleanup;
    }

    if (newmax < vm->def->memory) {
590
        lxcError(VIR_ERR_INVALID_ARG,
591
                         "%s", _("Cannot set max memory lower than current memory"));
R
Ryota Ozaki 已提交
592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615
        goto cleanup;
    }

    vm->def->maxmem = newmax;
    ret = 0;

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    return ret;
}

static int lxcDomainSetMemory(virDomainPtr dom, unsigned long newmem) {
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    virCgroupPtr cgroup = NULL;
    int ret = -1;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    lxcDriverUnlock(driver);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
616
        lxcError(VIR_ERR_NO_DOMAIN,
617
                 _("No domain with matching uuid '%s'"), uuidstr);
R
Ryota Ozaki 已提交
618 619 620 621
        goto cleanup;
    }

    if (newmem > vm->def->maxmem) {
622
        lxcError(VIR_ERR_INVALID_ARG,
623
                 "%s", _("Cannot set memory higher than max memory"));
R
Ryota Ozaki 已提交
624 625 626
        goto cleanup;
    }

D
Daniel P. Berrange 已提交
627
    if (virDomainObjIsActive(vm)) {
R
Ryota Ozaki 已提交
628
        if (virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) != 0) {
629
            lxcError(VIR_ERR_INTERNAL_ERROR,
R
Ryota Ozaki 已提交
630 631 632 633 634
                     _("Unable to get cgroup for %s\n"), vm->def->name);
            goto cleanup;
        }

        if (virCgroupSetMemory(cgroup, newmem) < 0) {
635
            lxcError(VIR_ERR_OPERATION_FAILED,
636
                     "%s", _("Failed to set memory for domain"));
R
Ryota Ozaki 已提交
637 638 639 640 641 642 643 644 645 646 647 648 649 650 651
            goto cleanup;
        }
    } else {
        vm->def->memory = newmem;
    }
    ret = 0;

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    if (cgroup)
        virCgroupFree(&cgroup);
    return ret;
}

D
Daniel Veillard 已提交
652
static char *lxcDomainDumpXML(virDomainPtr dom,
653
                              int flags)
D
Daniel Veillard 已提交
654
{
655 656 657
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    char *ret = NULL;
D
Daniel Veillard 已提交
658

659
    lxcDriverLock(driver);
660
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
661 662
    lxcDriverUnlock(driver);

D
Daniel Veillard 已提交
663
    if (!vm) {
664
        lxcError(VIR_ERR_INVALID_DOMAIN,
665
                 "%s", _("No domain with matching uuid"));
666
        goto cleanup;
D
Daniel Veillard 已提交
667 668
    }

669
    ret = virDomainDefFormat((flags & VIR_DOMAIN_XML_INACTIVE) &&
670 671 672 673
                             vm->newDef ? vm->newDef : vm->def,
                             flags);

cleanup:
674 675
    if (vm)
        virDomainObjUnlock(vm);
676
    return ret;
D
Daniel Veillard 已提交
677 678
}

679 680 681

/**
 * lxcVmCleanup:
682 683 684
 * @conn: pointer to connection
 * @driver: pointer to driver structure
 * @vm: pointer to VM to clean up
685 686 687 688 689 690 691
 *
 * waitpid() on the container process.  kill and wait the tty process
 * This is called by both lxcDomainDestroy and lxcSigHandler when a
 * container exits.
 *
 * Returns 0 on success or -1 in case of error
 */
692
static int lxcVmCleanup(lxc_driver_t *driver,
693
                        virDomainObjPtr  vm)
694 695 696 697
{
    int rc = -1;
    int waitRc;
    int childStatus = -1;
D
Dan Smith 已提交
698
    virCgroupPtr cgroup;
699
    int i;
700
    lxcDomainObjPrivatePtr priv = vm->privateData;
701 702 703 704 705 706

    while (((waitRc = waitpid(vm->pid, &childStatus, 0)) == -1) &&
           errno == EINTR)
        ; /* empty */

    if ((waitRc != vm->pid) && (errno != ECHILD)) {
707
        virReportSystemError(errno,
708 709
                             _("waitpid failed to wait for container %d: %d"),
                             vm->pid, waitRc);
710 711 712 713 714 715 716 717 718
    }

    rc = 0;

    if (WIFEXITED(childStatus)) {
        rc = WEXITSTATUS(childStatus);
        DEBUG("container exited with rc: %d", rc);
    }

719 720
    virEventRemoveHandle(priv->monitorWatch);
    close(priv->monitor);
721 722

    virFileDeletePid(driver->stateDir, vm->def->name);
723
    virDomainDeleteConfig(driver->stateDir, NULL, vm);
724 725 726 727

    vm->state = VIR_DOMAIN_SHUTOFF;
    vm->pid = -1;
    vm->def->id = -1;
728 729
    priv->monitor = -1;
    priv->monitorWatch = -1;
730

731 732 733
    for (i = 0 ; i < vm->def->nnets ; i++) {
        vethInterfaceUpOrDown(vm->def->nets[i]->ifname, 0);
        vethDelete(vm->def->nets[i]->ifname);
734 735
    }

736 737
    if (driver->cgroup &&
        virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) == 0) {
D
Dan Smith 已提交
738 739 740 741
        virCgroupRemove(cgroup);
        virCgroupFree(&cgroup);
    }

742 743 744 745 746 747 748
    if (vm->newDef) {
        virDomainDefFree(vm->def);
        vm->def = vm->newDef;
        vm->def->id = -1;
        vm->newDef = NULL;
    }

749 750 751
    return rc;
}

752 753
/**
 * lxcSetupInterfaces:
754
 * @conn: pointer to connection
755
 * @def: pointer to virtual machine structure
756 757
 * @nveths: number of interfaces
 * @veths: interface names
758 759 760 761 762 763 764 765
 *
 * Sets up the container interfaces by creating the veth device pairs and
 * attaching the parent end to the appropriate bridge.  The container end
 * will moved into the container namespace later after clone has been called.
 *
 * Returns 0 on success or -1 in case of error
 */
static int lxcSetupInterfaces(virConnectPtr conn,
766
                              virDomainDefPtr def,
767 768
                              unsigned int *nveths,
                              char ***veths)
769
{
770
    int rc = -1, i;
771
    char *bridge = NULL;
772 773
    char parentVeth[PATH_MAX] = "";
    char containerVeth[PATH_MAX] = "";
774
    brControl *brctl = NULL;
775

776
    if (brInit(&brctl) != 0)
777 778
        return -1;

779 780
    for (i = 0 ; i < def->nnets ; i++) {
        switch (def->nets[i]->type) {
781 782 783
        case VIR_DOMAIN_NET_TYPE_NETWORK:
        {
            virNetworkPtr network = virNetworkLookupByName(conn,
784
                                                           def->nets[i]->data.network.name);
785 786 787 788 789 790 791
            if (!network) {
                goto error_exit;
            }

            bridge = virNetworkGetBridgeName(network);

            virNetworkFree(network);
792 793 794
            break;
        }
        case VIR_DOMAIN_NET_TYPE_BRIDGE:
795
            bridge = def->nets[i]->data.bridge.brname;
796
            break;
797 798 799 800
        }

        DEBUG("bridge: %s", bridge);
        if (NULL == bridge) {
801
            lxcError(VIR_ERR_INTERNAL_ERROR,
802
                     "%s", _("Failed to get bridge for interface"));
803 804 805 806
            goto error_exit;
        }

        DEBUG0("calling vethCreate()");
807 808
        if (NULL != def->nets[i]->ifname) {
            strcpy(parentVeth, def->nets[i]->ifname);
809 810 811
        }
        DEBUG("parentVeth: %s, containerVeth: %s", parentVeth, containerVeth);
        if (0 != (rc = vethCreate(parentVeth, PATH_MAX, containerVeth, PATH_MAX))) {
812
            lxcError(VIR_ERR_INTERNAL_ERROR,
813
                     _("Failed to create veth device pair: %d"), rc);
814 815
            goto error_exit;
        }
816 817
        if (NULL == def->nets[i]->ifname) {
            def->nets[i]->ifname = strdup(parentVeth);
818
        }
819
        if (VIR_REALLOC_N(*veths, (*nveths)+1) < 0) {
820
            virReportOOMError();
821
            goto error_exit;
822 823
        }
        if (((*veths)[(*nveths)] = strdup(containerVeth)) == NULL) {
824
            virReportOOMError();
825
            goto error_exit;
826 827
        }
        (*nveths)++;
828

829
        if (NULL == def->nets[i]->ifname) {
830
            virReportOOMError();
831 832 833
            goto error_exit;
        }

834
        {
835 836 837
            char macaddr[VIR_MAC_STRING_BUFLEN];
            virFormatMacAddr(def->nets[i]->mac, macaddr);
            if (0 != (rc = setMacAddr(containerVeth, macaddr))) {
838
                virReportSystemError(rc,
839
                                     _("Failed to set %s to %s"),
840 841 842 843 844
                                     macaddr, containerVeth);
                goto error_exit;
            }
        }

845
        if (0 != (rc = brAddInterface(brctl, bridge, parentVeth))) {
846
            virReportSystemError(rc,
847
                                 _("Failed to add %s device to %s"),
848
                                 parentVeth, bridge);
849 850 851 852
            goto error_exit;
        }

        if (0 != (rc = vethInterfaceUpOrDown(parentVeth, 1))) {
853
            virReportSystemError(rc,
854 855
                                 _("Failed to enable %s device"),
                                 parentVeth);
856 857 858 859 860 861 862 863
            goto error_exit;
        }

    }

    rc = 0;

error_exit:
864
    brShutdown(brctl);
865 866 867
    return rc;
}

868

869
static int lxcMonitorClient(lxc_driver_t * driver,
870
                            virDomainObjPtr vm)
871
{
872 873 874
    char *sockpath = NULL;
    int fd;
    struct sockaddr_un addr;
875

876 877
    if (virAsprintf(&sockpath, "%s/%s.sock",
                    driver->stateDir, vm->def->name) < 0) {
878
        virReportOOMError();
879 880 881 882
        return -1;
    }

    if ((fd = socket(PF_UNIX, SOCK_STREAM, 0)) < 0) {
883
        virReportSystemError(errno, "%s",
884
                             _("Failed to create client socket"));
885
        goto error;
886 887
    }

888 889
    memset(&addr, 0, sizeof(addr));
    addr.sun_family = AF_UNIX;
C
Chris Lalancette 已提交
890
    if (virStrcpyStatic(addr.sun_path, sockpath) == NULL) {
891
        lxcError(VIR_ERR_INTERNAL_ERROR,
C
Chris Lalancette 已提交
892 893 894
                 _("Socket path %s too big for destination"), sockpath);
        goto error;
    }
895 896

    if (connect(fd, (struct sockaddr *) &addr, sizeof(addr)) < 0) {
897
        virReportSystemError(errno, "%s",
898
                             _("Failed to connect to client socket"));
899
        goto error;
900 901
    }

902 903
    VIR_FREE(sockpath);
    return fd;
904

905 906 907 908 909 910 911 912
error:
    VIR_FREE(sockpath);
    if (fd != -1)
        close(fd);
    return -1;
}


913
static int lxcVmTerminate(lxc_driver_t *driver,
914
                          virDomainObjPtr vm,
915 916 917 918
                          int signum)
{
    if (signum == 0)
        signum = SIGINT;
919

920
    if (vm->pid <= 0) {
921
        lxcError(VIR_ERR_INTERNAL_ERROR,
922
                 _("Invalid PID %d for container"), vm->pid);
923 924 925
        return -1;
    }

926 927
    if (kill(vm->pid, signum) < 0) {
        if (errno != ESRCH) {
928
            virReportSystemError(errno,
929
                                 _("Failed to kill pid %d"),
930
                                 vm->pid);
931
            return -1;
932
        }
933 934
    }

935
    vm->state = VIR_DOMAIN_SHUTDOWN;
936

937
    return lxcVmCleanup(driver, vm);
938
}
939

940 941
static void lxcMonitorEvent(int watch,
                            int fd,
942 943 944
                            int events ATTRIBUTE_UNUSED,
                            void *data)
{
945 946
    lxc_driver_t *driver = lxc_driver;
    virDomainObjPtr vm = data;
947
    virDomainEventPtr event = NULL;
948
    lxcDomainObjPrivatePtr priv;
949

950
    lxcDriverLock(driver);
951 952
    virDomainObjLock(vm);
    lxcDriverUnlock(driver);
953

954 955 956
    priv = vm->privateData;

    if (priv->monitor != fd || priv->monitorWatch != watch) {
957
        virEventRemoveHandle(watch);
958
        goto cleanup;
959 960
    }

961
    if (lxcVmTerminate(driver, vm, SIGINT) < 0) {
962
        virEventRemoveHandle(watch);
963 964 965 966 967
    } else {
        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_STOPPED,
                                         VIR_DOMAIN_EVENT_STOPPED_SHUTDOWN);
    }
968 969 970 971
    if (!vm->persistent) {
        virDomainRemoveInactive(&driver->domains, vm);
        vm = NULL;
    }
972 973

cleanup:
974 975
    if (vm)
        virDomainObjUnlock(vm);
976 977
    if (event) {
        lxcDriverLock(driver);
978
        lxcDomainEventQueue(driver, event);
979 980
        lxcDriverUnlock(driver);
    }
981 982 983
}


984
static int lxcControllerStart(lxc_driver_t *driver,
985 986 987 988 989 990 991 992 993 994
                              virDomainObjPtr vm,
                              int nveths,
                              char **veths,
                              int appPty,
                              int logfd)
{
    int i;
    int rc;
    int largc = 0, larga = 0;
    const char **largv = NULL;
A
Amy Griffis 已提交
995 996 997 998 999
    int lenvc = 0, lenva = 0;
    const char **lenv = NULL;
    char *filterstr;
    char *outputstr;
    char *tmp;
A
Amy Griffis 已提交
1000
    int log_level;
1001 1002
    pid_t child;
    int status;
1003 1004
    fd_set keepfd;
    char appPtyStr[30];
1005
    const char *emulator;
1006 1007

    FD_ZERO(&keepfd);
1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 1024 1025 1026 1027 1028 1029 1030

#define ADD_ARG_SPACE                                                   \
    do { \
        if (largc == larga) {                                           \
            larga += 10;                                                \
            if (VIR_REALLOC_N(largv, larga) < 0)                        \
                goto no_memory;                                         \
        }                                                               \
    } while (0)

#define ADD_ARG(thisarg)                                                \
    do {                                                                \
        ADD_ARG_SPACE;                                                  \
        largv[largc++] = thisarg;                                       \
    } while (0)

#define ADD_ARG_LIT(thisarg)                                            \
    do {                                                                \
        ADD_ARG_SPACE;                                                  \
        if ((largv[largc++] = strdup(thisarg)) == NULL)                 \
            goto no_memory;                                             \
    } while (0)

A
Amy Griffis 已提交
1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 1051 1052 1053 1054
#define ADD_ENV_SPACE                                                   \
    do {                                                                \
        if (lenvc == lenva) {                                           \
            lenva += 10;                                                \
            if (VIR_REALLOC_N(lenv, lenva) < 0)                         \
                goto no_memory;                                         \
        }                                                               \
    } while (0)

#define ADD_ENV(thisarg)                                                \
    do {                                                                \
        ADD_ENV_SPACE;                                                  \
        lenv[lenvc++] = thisarg;                                        \
    } while (0)

#define ADD_ENV_PAIR(envname, val)                                      \
    do {                                                                \
        char *envval;                                                   \
        ADD_ENV_SPACE;                                                  \
        if (virAsprintf(&envval, "%s=%s", envname, val) < 0)            \
            goto no_memory;                                             \
        lenv[lenvc++] = envval;                                         \
    } while (0)

1055 1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 1066 1067
#define ADD_ENV_COPY(envname)                                           \
    do {                                                                \
        char *val = getenv(envname);                                    \
        if (val != NULL) {                                              \
            ADD_ENV_PAIR(envname, val);                                 \
        }                                                               \
    } while (0)

    /*
     * The controller may call ip command, so we have to remain PATH.
     */
    ADD_ENV_COPY("PATH");

A
Amy Griffis 已提交
1068 1069
    log_level = virLogGetDefaultPriority();
    if (virAsprintf(&tmp, "LIBVIRT_DEBUG=%d", log_level) < 0)
A
Amy Griffis 已提交
1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080
        goto no_memory;
    ADD_ENV(tmp);

    if (virLogGetNbFilters() > 0) {
        filterstr = virLogGetFilters();
        if (!filterstr)
            goto no_memory;
        ADD_ENV_PAIR("LIBVIRT_LOG_FILTERS", filterstr);
        VIR_FREE(filterstr);
    }

A
Amy Griffis 已提交
1081 1082 1083 1084 1085 1086 1087 1088 1089 1090
    if (driver->log_libvirtd) {
        if (virLogGetNbOutputs() > 0) {
            outputstr = virLogGetOutputs();
            if (!outputstr)
                goto no_memory;
            ADD_ENV_PAIR("LIBVIRT_LOG_OUTPUTS", outputstr);
            VIR_FREE(outputstr);
        }
    } else {
        if (virAsprintf(&tmp, "LIBVIRT_LOG_OUTPUTS=%d:stderr", log_level) < 0)
A
Amy Griffis 已提交
1091
            goto no_memory;
A
Amy Griffis 已提交
1092
        ADD_ENV(tmp);
A
Amy Griffis 已提交
1093 1094 1095 1096
    }

    ADD_ENV(NULL);

1097 1098
    snprintf(appPtyStr, sizeof(appPtyStr), "%d", appPty);

1099 1100 1101
    emulator = vm->def->emulator;

    ADD_ARG_LIT(emulator);
1102 1103 1104
    ADD_ARG_LIT("--name");
    ADD_ARG_LIT(vm->def->name);
    ADD_ARG_LIT("--console");
1105
    ADD_ARG_LIT(appPtyStr);
1106 1107 1108 1109 1110 1111 1112 1113 1114
    ADD_ARG_LIT("--background");

    for (i = 0 ; i < nveths ; i++) {
        ADD_ARG_LIT("--veth");
        ADD_ARG_LIT(veths[i]);
    }

    ADD_ARG(NULL);

1115 1116
    FD_SET(appPty, &keepfd);

1117
    if (virExec(largv, lenv, &keepfd, &child,
1118
                -1, &logfd, &logfd,
1119 1120 1121 1122 1123 1124 1125 1126 1127
                VIR_EXEC_NONE) < 0)
        goto cleanup;

    /* We now wait for the process to exit - the controller
     * will fork() itself into the background - waiting for
     * it to exit thus guarentees it has written its pidfile
     */
    while ((rc = waitpid(child, &status, 0) == -1) && errno == EINTR);
    if (rc == -1) {
1128
        virReportSystemError(errno,
1129
                             _("Cannot wait for '%s'"),
1130
                             largv[0]);
1131 1132 1133 1134
        goto cleanup;
    }

    if (!(WIFEXITED(status) && WEXITSTATUS(status) == 0)) {
1135
        lxcError(VIR_ERR_INTERNAL_ERROR,
1136
                 _("Container '%s' unexpectedly shutdown during startup"),
1137 1138 1139 1140 1141 1142 1143
                 largv[0]);
        goto cleanup;
    }

#undef ADD_ARG
#undef ADD_ARG_LIT
#undef ADD_ARG_SPACE
A
Amy Griffis 已提交
1144 1145
#undef ADD_ENV_SPACE
#undef ADD_ENV_PAIR
1146

A
Amy Griffis 已提交
1147
    return 0;
1148 1149

no_memory:
1150
    virReportOOMError();
A
Amy Griffis 已提交
1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 1162
cleanup:
    if (largv) {
        for (i = 0 ; i < largc ; i++)
            VIR_FREE(largv[i]);
        VIR_FREE(largv);
    }
    if (lenv) {
        for (i=0 ; i < lenvc ; i++)
            VIR_FREE(lenv[i]);
        VIR_FREE(lenv);
    }
    return -1;
1163 1164 1165
}


1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177
/**
 * lxcVmStart:
 * @conn: pointer to connection
 * @driver: pointer to driver structure
 * @vm: pointer to virtual machine structure
 *
 * Starts a vm
 *
 * Returns 0 on success or -1 in case of error
 */
static int lxcVmStart(virConnectPtr conn,
                      lxc_driver_t * driver,
1178
                      virDomainObjPtr  vm)
1179
{
1180
    int rc = -1, r;
1181 1182
    unsigned int i;
    int parentTty;
1183
    char *parentTtyPath = NULL;
1184 1185 1186 1187
    char *logfile = NULL;
    int logfd = -1;
    unsigned int nveths = 0;
    char **veths = NULL;
1188
    lxcDomainObjPrivatePtr priv = vm->privateData;
1189

L
Laine Stump 已提交
1190
    if ((r = virFileMakePath(driver->logDir)) != 0) {
1191
        virReportSystemError(r,
1192
                             _("Cannot create log directory '%s'"),
1193
                             driver->logDir);
1194 1195
        return -1;
    }
1196

1197 1198
    if (virAsprintf(&logfile, "%s/%s.log",
                    driver->logDir, vm->def->name) < 0) {
1199
        virReportOOMError();
1200
        return -1;
1201 1202
    }

1203
    /* open parent tty */
1204
    if (virFileOpenTty(&parentTty, &parentTtyPath, 1) < 0) {
1205
        virReportSystemError(errno, "%s",
1206
                             _("Failed to allocate tty"));
1207 1208
        goto cleanup;
    }
1209 1210 1211 1212 1213 1214 1215
    if (vm->def->console &&
        vm->def->console->type == VIR_DOMAIN_CHR_TYPE_PTY) {
        VIR_FREE(vm->def->console->data.file.path);
        vm->def->console->data.file.path = parentTtyPath;
    } else {
        VIR_FREE(parentTtyPath);
    }
1216

1217
    if (lxcSetupInterfaces(conn, vm->def, &nveths, &veths) != 0)
1218
        goto cleanup;
1219

1220
    /* Persist the live configuration now we have veth & tty info */
1221
    if (virDomainSaveConfig(driver->stateDir, vm->def) < 0)
1222 1223
        goto cleanup;

1224
    if ((logfd = open(logfile, O_WRONLY | O_APPEND | O_CREAT,
1225
             S_IRUSR|S_IWUSR)) < 0) {
1226
        virReportSystemError(errno,
1227
                             _("Failed to open '%s'"),
1228
                             logfile);
1229
        goto cleanup;
1230 1231
    }

1232
    if (lxcControllerStart(driver,
1233 1234 1235
                           vm,
                           nveths, veths,
                           parentTty, logfd) < 0)
1236
        goto cleanup;
1237 1238 1239 1240

    /* Connect to the controller as a client *first* because
     * this will block until the child has written their
     * pid file out to disk */
1241
    if ((priv->monitor = lxcMonitorClient(driver, vm)) < 0)
1242 1243
        goto cleanup;

1244
    /* And get its pid */
1245
    if ((r = virFileReadPid(driver->stateDir, vm->def->name, &vm->pid)) != 0) {
1246
        virReportSystemError(r,
1247 1248
                             _("Failed to read pid file %s/%s.pid"),
                             driver->stateDir, vm->def->name);
1249
        goto cleanup;
1250
    }
1251

1252
    vm->def->id = vm->pid;
1253 1254
    vm->state = VIR_DOMAIN_RUNNING;

1255 1256
    if ((priv->monitorWatch = virEventAddHandle(
             priv->monitor,
1257 1258
             VIR_EVENT_HANDLE_ERROR | VIR_EVENT_HANDLE_HANGUP,
             lxcMonitorEvent,
1259
             vm, NULL)) < 0) {
1260
        lxcVmTerminate(driver, vm, 0);
1261 1262
        goto cleanup;
    }
1263

1264 1265 1266 1267 1268 1269 1270 1271
    rc = 0;

cleanup:
    for (i = 0 ; i < nveths ; i++) {
        if (rc != 0)
            vethDelete(veths[i]);
        VIR_FREE(veths[i]);
    }
1272 1273 1274
    if (rc != 0 && priv->monitor != -1) {
        close(priv->monitor);
        priv->monitor = -1;
1275 1276 1277 1278 1279 1280
    }
    if (parentTty != -1)
        close(parentTty);
    if (logfd != -1)
        close(logfd);
    VIR_FREE(logfile);
1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293
    return rc;
}

/**
 * lxcDomainStart:
 * @dom: domain to start
 *
 * Looks up domain and starts it.
 *
 * Returns 0 on success or -1 in case of error
 */
static int lxcDomainStart(virDomainPtr dom)
{
1294 1295
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
1296
    virDomainEventPtr event = NULL;
1297
    int ret = -1;
1298

1299
    lxcDriverLock(driver);
1300
    vm = virDomainFindByName(&driver->domains, dom->name);
1301
    if (!vm) {
1302
        lxcError(VIR_ERR_INVALID_DOMAIN,
1303
                 _("No domain named %s"), dom->name);
1304 1305 1306
        goto cleanup;
    }

1307
    if ((vm->def->nets != NULL) && !(driver->have_netns)) {
1308
        lxcError(VIR_ERR_NO_SUPPORT,
J
Jim Meyering 已提交
1309
                 "%s", _("System lacks NETNS support"));
1310 1311 1312
        goto cleanup;
    }

1313
    ret = lxcVmStart(dom->conn, driver, vm);
1314

1315 1316 1317 1318 1319
    if (ret == 0)
        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_STARTED,
                                         VIR_DOMAIN_EVENT_STARTED_BOOTED);

1320
cleanup:
1321 1322
    if (vm)
        virDomainObjUnlock(vm);
1323 1324
    if (event)
        lxcDomainEventQueue(driver, event);
1325
    lxcDriverUnlock(driver);
1326
    return ret;
1327 1328 1329 1330 1331 1332 1333 1334 1335 1336 1337 1338 1339 1340 1341 1342
}

/**
 * lxcDomainCreateAndStart:
 * @conn: pointer to connection
 * @xml: XML definition of domain
 * @flags: Unused
 *
 * Creates a domain based on xml and starts it
 *
 * Returns 0 on success or -1 in case of error
 */
static virDomainPtr
lxcDomainCreateAndStart(virConnectPtr conn,
                        const char *xml,
                        unsigned int flags ATTRIBUTE_UNUSED) {
1343
    lxc_driver_t *driver = conn->privateData;
1344
    virDomainObjPtr vm = NULL;
1345
    virDomainDefPtr def;
1346
    virDomainPtr dom = NULL;
1347
    virDomainEventPtr event = NULL;
1348

1349
    lxcDriverLock(driver);
1350
    if (!(def = virDomainDefParseString(driver->caps, xml,
1351
                                        VIR_DOMAIN_XML_INACTIVE)))
1352
        goto cleanup;
1353

1354 1355
    if (virDomainObjIsDuplicate(&driver->domains, def, 1) < 0)
        goto cleanup;
1356

1357
    if ((def->nets != NULL) && !(driver->have_netns)) {
1358
        lxcError(VIR_ERR_NO_SUPPORT,
J
Jim Meyering 已提交
1359
                 "%s", _("System lacks NETNS support"));
1360
        goto cleanup;
1361 1362
    }

1363

1364
    if (!(vm = virDomainAssignDef(driver->caps,
1365
                                  &driver->domains, def)))
1366 1367
        goto cleanup;
    def = NULL;
1368 1369

    if (lxcVmStart(conn, driver, vm) < 0) {
1370
        virDomainRemoveInactive(&driver->domains, vm);
1371
        vm = NULL;
1372
        goto cleanup;
1373 1374
    }

1375 1376 1377 1378
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STARTED,
                                     VIR_DOMAIN_EVENT_STARTED_BOOTED);

1379
    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
1380
    if (dom)
1381 1382
        dom->id = vm->def->id;

1383 1384
cleanup:
    virDomainDefFree(def);
1385 1386
    if (vm)
        virDomainObjUnlock(vm);
1387 1388
    if (event)
        lxcDomainEventQueue(driver, event);
1389
    lxcDriverUnlock(driver);
1390 1391 1392 1393 1394
    return dom;
}

/**
 * lxcDomainShutdown:
1395
 * @dom: pointer to domain to shutdown
1396 1397 1398 1399 1400 1401 1402
 *
 * Sends SIGINT to container root process to request it to shutdown
 *
 * Returns 0 on success or -1 in case of error
 */
static int lxcDomainShutdown(virDomainPtr dom)
{
1403 1404
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
1405
    virDomainEventPtr event = NULL;
1406
    int ret = -1;
1407

1408
    lxcDriverLock(driver);
1409
    vm = virDomainFindByID(&driver->domains, dom->id);
1410
    if (!vm) {
1411
        lxcError(VIR_ERR_INVALID_DOMAIN,
1412
                 _("No domain with id %d"), dom->id);
1413
        goto cleanup;
1414 1415
    }

1416
    ret = lxcVmTerminate(driver, vm, 0);
1417 1418 1419
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STOPPED,
                                     VIR_DOMAIN_EVENT_STOPPED_SHUTDOWN);
1420 1421 1422 1423
    if (!vm->persistent) {
        virDomainRemoveInactive(&driver->domains, vm);
        vm = NULL;
    }
1424 1425

cleanup:
1426 1427
    if (vm)
        virDomainObjUnlock(vm);
1428 1429 1430 1431 1432 1433 1434 1435 1436 1437 1438 1439 1440 1441 1442 1443 1444 1445 1446
    if (event)
        lxcDomainEventQueue(driver, event);
    lxcDriverUnlock(driver);
    return ret;
}


static int
lxcDomainEventRegister (virConnectPtr conn,
                        virConnectDomainEventCallback callback,
                        void *opaque,
                        virFreeCallback freecb)
{
    lxc_driver_t *driver = conn->privateData;
    int ret;

    lxcDriverLock(driver);
    ret = virDomainEventCallbackListAdd(conn, driver->domainEventCallbacks,
                                        callback, opaque, freecb);
1447
    lxcDriverUnlock(driver);
1448

1449
    return ret;
1450 1451
}

1452 1453 1454 1455 1456 1457 1458 1459 1460 1461 1462 1463 1464 1465 1466 1467 1468 1469 1470 1471 1472 1473 1474 1475 1476 1477 1478 1479 1480 1481 1482 1483 1484 1485 1486 1487 1488 1489 1490 1491 1492 1493 1494 1495 1496 1497 1498 1499 1500 1501 1502 1503 1504 1505 1506 1507 1508 1509 1510 1511 1512 1513 1514 1515 1516 1517 1518 1519 1520 1521 1522 1523 1524
static int
lxcDomainEventDeregister (virConnectPtr conn,
                          virConnectDomainEventCallback callback)
{
    lxc_driver_t *driver = conn->privateData;
    int ret;

    lxcDriverLock(driver);
    if (driver->domainEventDispatching)
        ret = virDomainEventCallbackListMarkDelete(conn, driver->domainEventCallbacks,
                                                   callback);
    else
        ret = virDomainEventCallbackListRemove(conn, driver->domainEventCallbacks,
                                               callback);
    lxcDriverUnlock(driver);

    return ret;
}

static void lxcDomainEventDispatchFunc(virConnectPtr conn,
                                       virDomainEventPtr event,
                                       virConnectDomainEventCallback cb,
                                       void *cbopaque,
                                       void *opaque)
{
    lxc_driver_t *driver = opaque;

    /* Drop the lock whle dispatching, for sake of re-entrancy */
    lxcDriverUnlock(driver);
    virDomainEventDispatchDefaultFunc(conn, event, cb, cbopaque, NULL);
    lxcDriverLock(driver);
}


static void lxcDomainEventFlush(int timer ATTRIBUTE_UNUSED, void *opaque)
{
    lxc_driver_t *driver = opaque;
    virDomainEventQueue tempQueue;

    lxcDriverLock(driver);

    driver->domainEventDispatching = 1;

    /* Copy the queue, so we're reentrant safe */
    tempQueue.count = driver->domainEventQueue->count;
    tempQueue.events = driver->domainEventQueue->events;
    driver->domainEventQueue->count = 0;
    driver->domainEventQueue->events = NULL;

    virEventUpdateTimeout(driver->domainEventTimer, -1);
    virDomainEventQueueDispatch(&tempQueue,
                                driver->domainEventCallbacks,
                                lxcDomainEventDispatchFunc,
                                driver);

    /* Purge any deleted callbacks */
    virDomainEventCallbackListPurgeMarked(driver->domainEventCallbacks);

    driver->domainEventDispatching = 0;
    lxcDriverUnlock(driver);
}


/* driver must be locked before calling */
static void lxcDomainEventQueue(lxc_driver_t *driver,
                                 virDomainEventPtr event)
{
    if (virDomainEventQueuePush(driver->domainEventQueue,
                                event) < 0)
        virDomainEventFree(event);
    if (lxc_driver->domainEventQueue->count == 1)
        virEventUpdateTimeout(driver->domainEventTimer, 0);
}
1525 1526 1527

/**
 * lxcDomainDestroy:
1528
 * @dom: pointer to domain to destroy
1529 1530 1531 1532 1533 1534 1535
 *
 * Sends SIGKILL to container root process to terminate the container
 *
 * Returns 0 on success or -1 in case of error
 */
static int lxcDomainDestroy(virDomainPtr dom)
{
1536 1537
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
1538
    virDomainEventPtr event = NULL;
1539
    int ret = -1;
1540

1541
    lxcDriverLock(driver);
1542
    vm = virDomainFindByID(&driver->domains, dom->id);
1543
    if (!vm) {
1544
        lxcError(VIR_ERR_INVALID_DOMAIN,
1545
                 _("No domain with id %d"), dom->id);
1546
        goto cleanup;
1547 1548
    }

1549
    ret = lxcVmTerminate(driver, vm, SIGKILL);
1550 1551 1552
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STOPPED,
                                     VIR_DOMAIN_EVENT_STOPPED_DESTROYED);
1553 1554 1555 1556
    if (!vm->persistent) {
        virDomainRemoveInactive(&driver->domains, vm);
        vm = NULL;
    }
1557 1558

cleanup:
1559 1560
    if (vm)
        virDomainObjUnlock(vm);
1561 1562
    if (event)
        lxcDomainEventQueue(driver, event);
1563
    lxcDriverUnlock(driver);
1564
    return ret;
1565
}
1566

1567 1568 1569 1570 1571
static int lxcCheckNetNsSupport(void)
{
    const char *argv[] = {"ip", "link", "set", "lo", "netns", "-1", NULL};
    int ip_rc;

1572
    if (virRun(argv, &ip_rc) < 0 ||
1573 1574
        !(WIFEXITED(ip_rc) && (WEXITSTATUS(ip_rc) != 255)))
        return 0;
1575

1576 1577
    if (lxcContainerAvailable(LXC_CONTAINER_FEATURE_NET) < 0)
        return 0;
1578

1579
    return 1;
1580 1581
}

1582

1583 1584 1585 1586 1587 1588 1589 1590 1591 1592 1593 1594 1595
struct lxcAutostartData {
    lxc_driver_t *driver;
    virConnectPtr conn;
};

static void
lxcAutostartDomain(void *payload, const char *name ATTRIBUTE_UNUSED, void *opaque)
{
    virDomainObjPtr vm = payload;
    const struct lxcAutostartData *data = opaque;

    virDomainObjLock(vm);
    if (vm->autostart &&
D
Daniel P. Berrange 已提交
1596
        !virDomainObjIsActive(vm)) {
1597 1598 1599
        int ret = lxcVmStart(data->conn, data->driver, vm);
        if (ret < 0) {
            virErrorPtr err = virGetLastError();
1600
            VIR_ERROR(_("Failed to autostart VM '%s': %s"),
1601 1602 1603 1604 1605 1606 1607 1608 1609 1610 1611 1612 1613 1614
                      vm->def->name,
                      err ? err->message : "");
        } else {
            virDomainEventPtr event =
                virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_STARTED,
                                         VIR_DOMAIN_EVENT_STARTED_BOOTED);
            if (event)
                lxcDomainEventQueue(data->driver, event);
        }
    }
    virDomainObjUnlock(vm);
}

1615 1616 1617 1618 1619 1620 1621 1622 1623 1624
static void
lxcAutostartConfigs(lxc_driver_t *driver) {
    /* XXX: Figure out a better way todo this. The domain
     * startup code needs a connection handle in order
     * to lookup the bridge associated with a virtual
     * network
     */
    virConnectPtr conn = virConnectOpen("lxc:///");
    /* Ignoring NULL conn which is mostly harmless here */

1625 1626
    struct lxcAutostartData data = { driver, conn };

1627
    lxcDriverLock(driver);
1628
    virHashForEach(driver->domains.objs, lxcAutostartDomain, &data);
1629 1630 1631 1632 1633 1634
    lxcDriverUnlock(driver);

    if (conn)
        virConnectClose(conn);
}

1635 1636 1637 1638 1639 1640 1641
static void
lxcReconnectVM(void *payload, const char *name ATTRIBUTE_UNUSED, void *opaque)
{
    virDomainObjPtr vm = payload;
    lxc_driver_t *driver = opaque;
    char *config = NULL;
    virDomainDefPtr tmp;
1642
    lxcDomainObjPrivatePtr priv;
1643 1644

    virDomainObjLock(vm);
1645 1646

    priv = vm->privateData;
1647
    if ((priv->monitor = lxcMonitorClient(driver, vm)) < 0) {
1648 1649 1650 1651 1652
        goto cleanup;
    }

    /* Read pid from controller */
    if ((virFileReadPid(lxc_driver->stateDir, vm->def->name, &vm->pid)) != 0) {
1653 1654
        close(priv->monitor);
        priv->monitor = -1;
1655 1656 1657
        goto cleanup;
    }

1658
    if ((config = virDomainConfigFile(driver->stateDir,
1659 1660 1661 1662
                                      vm->def->name)) == NULL)
        goto cleanup;

    /* Try and load the live config */
1663
    tmp = virDomainDefParseFile(driver->caps, config, 0);
1664 1665 1666 1667 1668 1669 1670 1671 1672
    VIR_FREE(config);
    if (tmp) {
        vm->newDef = vm->def;
        vm->def = tmp;
    }

    if (vm->pid != 0) {
        vm->def->id = vm->pid;
        vm->state = VIR_DOMAIN_RUNNING;
1673 1674 1675 1676 1677 1678

        if ((priv->monitorWatch = virEventAddHandle(
                 priv->monitor,
                 VIR_EVENT_HANDLE_ERROR | VIR_EVENT_HANDLE_HANGUP,
                 lxcMonitorEvent,
                 vm, NULL)) < 0) {
1679
            lxcVmTerminate(driver, vm, 0);
1680 1681
            goto cleanup;
        }
1682 1683
    } else {
        vm->def->id = -1;
1684 1685
        close(priv->monitor);
        priv->monitor = -1;
1686 1687 1688 1689 1690 1691
    }

cleanup:
    virDomainObjUnlock(vm);
}

1692

1693
static int lxcStartup(int privileged)
D
Daniel Veillard 已提交
1694
{
1695
    char *ld;
1696
    int rc;
1697 1698 1699 1700 1701 1702

    /* Valgrind gets very annoyed when we clone containers, so
     * disable LXC when under valgrind
     * XXX remove this when valgrind is fixed
     */
    ld = getenv("LD_PRELOAD");
1703 1704 1705 1706
    if (ld && strstr(ld, "vgpreload")) {
        VIR_INFO0("Running under valgrind, disabling driver");
        return 0;
    }
1707

1708
    /* Check that the user is root, silently disable if not */
1709
    if (!privileged) {
1710 1711 1712 1713 1714 1715 1716 1717
        VIR_INFO0("Not running privileged, disabling driver");
        return 0;
    }

    /* Check that this is a container enabled kernel */
    if (lxcContainerAvailable(0) < 0) {
        VIR_INFO0("LXC support not available in this kernel, disabling driver");
        return 0;
1718 1719
    }

1720
    if (VIR_ALLOC(lxc_driver) < 0) {
1721 1722
        return -1;
    }
1723 1724 1725 1726
    if (virMutexInit(&lxc_driver->lock) < 0) {
        VIR_FREE(lxc_driver);
        return -1;
    }
1727
    lxcDriverLock(lxc_driver);
D
Daniel Veillard 已提交
1728

1729 1730 1731
    if (virDomainObjListInit(&lxc_driver->domains) < 0)
        goto cleanup;

1732
    if (VIR_ALLOC(lxc_driver->domainEventCallbacks) < 0)
1733 1734 1735 1736 1737 1738 1739 1740
        goto cleanup;
    if (!(lxc_driver->domainEventQueue = virDomainEventQueueNew()))
        goto cleanup;

    if ((lxc_driver->domainEventTimer =
         virEventAddTimeout(-1, lxcDomainEventFlush, lxc_driver, NULL)) < 0)
        goto cleanup;

A
Amy Griffis 已提交
1741
    lxc_driver->log_libvirtd = 0; /* by default log to container logfile */
1742
    lxc_driver->have_netns = lxcCheckNetNsSupport();
D
Daniel Veillard 已提交
1743

1744 1745 1746 1747 1748 1749 1750
    rc = virCgroupForDriver("lxc", &lxc_driver->cgroup, privileged, 1);
    if (rc < 0) {
        char buf[1024];
        VIR_WARN("Unable to create cgroup for driver: %s",
                 virStrerror(-rc, buf, sizeof(buf)));
    }

D
Daniel Veillard 已提交
1751
    /* Call function to load lxc driver configuration information */
1752 1753
    if (lxcLoadDriverConfig(lxc_driver) < 0)
        goto cleanup;
D
Daniel Veillard 已提交
1754

1755 1756
    if ((lxc_driver->caps = lxcCapsInit()) == NULL)
        goto cleanup;
D
Daniel Veillard 已提交
1757

1758 1759 1760
    lxc_driver->caps->privateDataAllocFunc = lxcDomainObjPrivateAlloc;
    lxc_driver->caps->privateDataFreeFunc = lxcDomainObjPrivateFree;

1761
    if (virDomainLoadAllConfigs(lxc_driver->caps,
1762 1763
                                &lxc_driver->domains,
                                lxc_driver->configDir,
1764
                                lxc_driver->autostartDir,
1765
                                0, NULL, NULL) < 0)
1766
        goto cleanup;
1767

1768
    virHashForEach(lxc_driver->domains.objs, lxcReconnectVM, lxc_driver);
1769

1770
    lxcDriverUnlock(lxc_driver);
D
Daniel Veillard 已提交
1771 1772
    return 0;

1773 1774 1775 1776
cleanup:
    lxcDriverUnlock(lxc_driver);
    lxcShutdown();
    return -1;
D
Daniel Veillard 已提交
1777 1778
}

1779 1780 1781 1782 1783 1784 1785 1786 1787 1788 1789 1790 1791 1792 1793 1794 1795 1796 1797 1798 1799 1800 1801 1802 1803 1804
static void lxcNotifyLoadDomain(virDomainObjPtr vm, int newVM, void *opaque)
{
    lxc_driver_t *driver = opaque;

    if (newVM) {
        virDomainEventPtr event =
            virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_DEFINED,
                                     VIR_DOMAIN_EVENT_DEFINED_ADDED);
        if (event)
            lxcDomainEventQueue(driver, event);
    }
}

/**
 * lxcReload:
 *
 * Function to restart the LXC driver, it will recheck the configuration
 * files and perform autostart
 */
static int
lxcReload(void) {
    if (!lxc_driver)
        return 0;

    lxcDriverLock(lxc_driver);
1805
    virDomainLoadAllConfigs(lxc_driver->caps,
1806 1807 1808 1809 1810 1811 1812 1813 1814 1815 1816
                            &lxc_driver->domains,
                            lxc_driver->configDir,
                            lxc_driver->autostartDir,
                            0, lxcNotifyLoadDomain, lxc_driver);
    lxcDriverUnlock(lxc_driver);

    lxcAutostartConfigs(lxc_driver);

    return 0;
}

1817
static int lxcShutdown(void)
D
Daniel Veillard 已提交
1818
{
1819
    if (lxc_driver == NULL)
1820
        return(-1);
1821

1822
    lxcDriverLock(lxc_driver);
1823
    virDomainObjListDeinit(&lxc_driver->domains);
1824

1825 1826 1827 1828 1829 1830
    virDomainEventCallbackListFree(lxc_driver->domainEventCallbacks);
    virDomainEventQueueFree(lxc_driver->domainEventQueue);

    if (lxc_driver->domainEventTimer != -1)
        virEventRemoveTimeout(lxc_driver->domainEventTimer);

1831 1832 1833 1834 1835 1836
    virCapabilitiesFree(lxc_driver->caps);
    VIR_FREE(lxc_driver->configDir);
    VIR_FREE(lxc_driver->autostartDir);
    VIR_FREE(lxc_driver->stateDir);
    VIR_FREE(lxc_driver->logDir);
    lxcDriverUnlock(lxc_driver);
1837
    virMutexDestroy(&lxc_driver->lock);
1838
    VIR_FREE(lxc_driver);
1839 1840 1841

    return 0;
}
D
Daniel Veillard 已提交
1842

1843 1844 1845 1846 1847 1848 1849 1850 1851
/**
 * lxcActive:
 *
 * Checks if the LXC daemon is active, i.e. has an active domain
 *
 * Returns 1 if active, 0 otherwise
 */
static int
lxcActive(void) {
1852
    int active;
1853

1854 1855
    if (lxc_driver == NULL)
        return(0);
1856

1857
    lxcDriverLock(lxc_driver);
1858
    active = virDomainObjListNumOfDomains(&lxc_driver->domains, 1);
1859
    lxcDriverUnlock(lxc_driver);
1860

1861
    return active;
D
Daniel Veillard 已提交
1862 1863
}

1864
static int lxcVersion(virConnectPtr conn ATTRIBUTE_UNUSED, unsigned long *version)
D
Dan Smith 已提交
1865 1866 1867 1868 1869 1870
{
    struct utsname ver;
    int maj;
    int min;
    int rev;

1871
    uname(&ver);
D
Dan Smith 已提交
1872 1873

    if (sscanf(ver.release, "%i.%i.%i", &maj, &min, &rev) != 3) {
1874
        lxcError(VIR_ERR_INTERNAL_ERROR,
D
Dan Smith 已提交
1875 1876 1877 1878 1879 1880 1881 1882
                 _("Unknown release: %s"), ver.release);
        return -1;
    }

    *version = (maj * 1000 * 1000) + (min * 1000) + rev;

    return 0;
}
1883

1884 1885
static char *lxcGetSchedulerType(virDomainPtr domain ATTRIBUTE_UNUSED,
                                 int *nparams)
1886
{
1887 1888
    char *schedulerType = NULL;

1889 1890 1891
    if (nparams)
        *nparams = 1;

1892 1893 1894
    schedulerType = strdup("posix");

    if (schedulerType == NULL)
1895
        virReportOOMError();
1896 1897

    return schedulerType;
1898 1899
}

1900
static int lxcSetSchedulerParameters(virDomainPtr domain,
1901 1902 1903
                                     virSchedParameterPtr params,
                                     int nparams)
{
1904
    lxc_driver_t *driver = domain->conn->privateData;
1905
    int i;
1906 1907 1908
    virCgroupPtr group = NULL;
    virDomainObjPtr vm = NULL;
    int ret = -1;
1909

1910
    if (driver->cgroup == NULL)
1911 1912 1913 1914
        return -1;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);
1915

1916
    if (vm == NULL) {
1917
        lxcError(VIR_ERR_INTERNAL_ERROR,
1918 1919
                 _("No such domain %s"), domain->uuid);
        goto cleanup;
1920 1921
    }

1922
    if (virCgroupForDomain(driver->cgroup, vm->def->name, &group, 0) != 0)
1923
        goto cleanup;
1924 1925 1926

    for (i = 0; i < nparams; i++) {
        virSchedParameterPtr param = &params[i];
1927
        if (param->type != VIR_DOMAIN_SCHED_FIELD_ULLONG) {
1928
            lxcError(VIR_ERR_INVALID_ARG, "%s",
1929
                     _("Invalid type for cpu_shares tunable, expected a 'ullong'"));
1930 1931
            goto cleanup;
        }
1932 1933

        if (STREQ(param->field, "cpu_shares")) {
1934
            if (virCgroupSetCpuShares(group, params[i].value.ul) != 0)
1935
                goto cleanup;
1936
        } else {
1937
            lxcError(VIR_ERR_INVALID_ARG,
1938
                     _("Invalid parameter `%s'"), param->field);
1939
            goto cleanup;
1940 1941
        }
    }
1942
    ret = 0;
1943

1944
cleanup:
1945
    lxcDriverUnlock(driver);
1946
    virCgroupFree(&group);
1947 1948
    if (vm)
        virDomainObjUnlock(vm);
1949
    return ret;
1950 1951
}

1952
static int lxcGetSchedulerParameters(virDomainPtr domain,
1953 1954 1955
                                     virSchedParameterPtr params,
                                     int *nparams)
{
1956
    lxc_driver_t *driver = domain->conn->privateData;
1957 1958
    virCgroupPtr group = NULL;
    virDomainObjPtr vm = NULL;
1959
    unsigned long long val;
1960
    int ret = -1;
1961

1962
    if (driver->cgroup == NULL)
1963
        return -1;
1964 1965

    if ((*nparams) != 1) {
1966
        lxcError(VIR_ERR_INVALID_ARG,
J
Jim Meyering 已提交
1967
                 "%s", _("Invalid parameter count"));
1968
        return -1;
1969 1970
    }

1971 1972 1973
    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);

1974
    if (vm == NULL) {
1975
        lxcError(VIR_ERR_INTERNAL_ERROR,
1976 1977
                 _("No such domain %s"), domain->uuid);
        goto cleanup;
1978 1979
    }

1980
    if (virCgroupForDomain(driver->cgroup, vm->def->name, &group, 0) != 0)
1981
        goto cleanup;
1982

1983 1984
    if (virCgroupGetCpuShares(group, &val) != 0)
        goto cleanup;
1985
    params[0].value.ul = val;
C
Chris Lalancette 已提交
1986
    if (virStrcpyStatic(params[0].field, "cpu_shares") == NULL) {
1987
        lxcError(VIR_ERR_INTERNAL_ERROR,
C
Chris Lalancette 已提交
1988 1989 1990
                 "%s", _("Field cpu_shares too big for destination"));
        goto cleanup;
    }
1991 1992
    params[0].type = VIR_DOMAIN_SCHED_FIELD_ULLONG;

1993
    ret = 0;
1994

1995
cleanup:
1996
    lxcDriverUnlock(driver);
1997
    virCgroupFree(&group);
1998 1999
    if (vm)
        virDomainObjUnlock(vm);
2000
    return ret;
2001 2002
}

2003 2004 2005 2006 2007 2008 2009 2010 2011 2012 2013 2014 2015 2016 2017 2018 2019 2020
#ifdef __linux__
static int
lxcDomainInterfaceStats(virDomainPtr dom,
                        const char *path,
                        struct _virDomainInterfaceStats *stats)
{
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int i;
    int ret = -1;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    lxcDriverUnlock(driver);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
2021
        lxcError(VIR_ERR_NO_DOMAIN,
2022 2023 2024 2025 2026
                 _("No domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    if (!virDomainObjIsActive(vm)) {
2027
        lxcError(VIR_ERR_OPERATION_INVALID,
2028 2029 2030 2031 2032 2033 2034 2035 2036 2037 2038 2039 2040 2041
                 "%s", _("Domain is not running"));
        goto cleanup;
    }

    /* Check the path is one of the domain's network interfaces. */
    for (i = 0 ; i < vm->def->nnets ; i++) {
        if (vm->def->nets[i]->ifname &&
            STREQ(vm->def->nets[i]->ifname, path)) {
            ret = 0;
            break;
        }
    }

    if (ret == 0)
2042
        ret = linuxDomainInterfaceStats(path, stats);
2043
    else
2044
        lxcError(VIR_ERR_INVALID_ARG,
2045 2046 2047 2048 2049 2050 2051 2052 2053 2054 2055 2056
                 _("Invalid path, '%s' is not a known interface"), path);

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    return ret;
}
#else
static int
lxcDomainInterfaceStats(virDomainPtr dom,
                        const char *path ATTRIBUTE_UNUSED,
                        struct _virDomainInterfaceStats *stats ATTRIBUTE_UNUSED)
2057
    lxcError(VIR_ERR_NO_SUPPORT, "%s", __FUNCTION__);
2058 2059 2060 2061
    return -1;
}
#endif

2062 2063 2064 2065 2066 2067 2068 2069 2070 2071 2072 2073 2074
static int lxcDomainGetAutostart(virDomainPtr dom,
                                   int *autostart) {
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    lxcDriverUnlock(driver);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
2075
        lxcError(VIR_ERR_NO_DOMAIN,
2076
                 _("No domain with matching uuid '%s'"), uuidstr);
2077 2078 2079 2080 2081 2082 2083 2084 2085 2086 2087 2088 2089 2090 2091 2092 2093 2094 2095 2096 2097 2098 2099 2100 2101
        goto cleanup;
    }

    *autostart = vm->autostart;
    ret = 0;

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    return ret;
}

static int lxcDomainSetAutostart(virDomainPtr dom,
                                   int autostart) {
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    char *configFile = NULL, *autostartLink = NULL;
    int ret = -1;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
2102
        lxcError(VIR_ERR_NO_DOMAIN,
2103
                 _("No domain with matching uuid '%s'"), uuidstr);
2104 2105 2106 2107
        goto cleanup;
    }

    if (!vm->persistent) {
2108
        lxcError(VIR_ERR_INTERNAL_ERROR,
2109
                 "%s", _("Cannot set autostart for transient domain"));
2110 2111 2112 2113 2114
        goto cleanup;
    }

    autostart = (autostart != 0);

2115 2116 2117 2118
    if (vm->autostart == autostart) {
        ret = 0;
        goto cleanup;
    }
2119

2120
    configFile = virDomainConfigFile(driver->configDir,
2121 2122 2123
                                     vm->def->name);
    if (configFile == NULL)
        goto cleanup;
2124
    autostartLink = virDomainConfigFile(driver->autostartDir,
2125 2126 2127
                                        vm->def->name);
    if (autostartLink == NULL)
        goto cleanup;
2128

2129 2130
    if (autostart) {
        int err;
2131

2132
        if ((err = virFileMakePath(driver->autostartDir))) {
2133
            virReportSystemError(err,
2134 2135 2136
                                 _("Cannot create autostart directory %s"),
                                 driver->autostartDir);
            goto cleanup;
2137 2138
        }

2139
        if (symlink(configFile, autostartLink) < 0) {
2140
            virReportSystemError(errno,
2141 2142 2143 2144 2145 2146
                                 _("Failed to create symlink '%s to '%s'"),
                                 autostartLink, configFile);
            goto cleanup;
        }
    } else {
        if (unlink(autostartLink) < 0 && errno != ENOENT && errno != ENOTDIR) {
2147
            virReportSystemError(errno,
2148 2149 2150 2151
                                 _("Failed to delete symlink '%s'"),
                                 autostartLink);
            goto cleanup;
        }
2152
    }
2153 2154

    vm->autostart = autostart;
2155 2156 2157 2158 2159 2160 2161 2162 2163 2164 2165
    ret = 0;

cleanup:
    VIR_FREE(configFile);
    VIR_FREE(autostartLink);
    if (vm)
        virDomainObjUnlock(vm);
    lxcDriverUnlock(driver);
    return ret;
}

R
Ryota Ozaki 已提交
2166 2167 2168 2169 2170 2171 2172 2173 2174 2175 2176 2177 2178 2179 2180 2181 2182 2183 2184 2185 2186 2187 2188 2189 2190 2191 2192 2193 2194 2195 2196 2197 2198 2199 2200 2201 2202 2203 2204 2205 2206 2207 2208 2209 2210 2211 2212 2213 2214 2215 2216 2217 2218 2219 2220 2221 2222 2223 2224 2225 2226 2227 2228 2229 2230 2231 2232 2233 2234 2235 2236 2237 2238 2239 2240 2241 2242 2243 2244 2245 2246 2247 2248 2249 2250 2251 2252 2253 2254 2255 2256 2257 2258 2259 2260 2261 2262 2263 2264 2265 2266 2267 2268 2269 2270
static int lxcFreezeContainer(lxc_driver_t *driver, virDomainObjPtr vm)
{
    int timeout = 1000; /* In milliseconds */
    int check_interval = 1; /* In milliseconds */
    int exp = 10;
    int waited_time = 0;
    int ret = -1;
    char *state = NULL;
    virCgroupPtr cgroup = NULL;

    if (!(driver->cgroup &&
        virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) == 0))
        return -1;

    while (waited_time < timeout) {
        int r;
        /*
         * Writing "FROZEN" to the "freezer.state" freezes the group,
         * i.e., the container, temporarily transiting "FREEZING" state.
         * Once the freezing is completed, the state of the group transits
         * to "FROZEN".
         * (see linux-2.6/Documentation/cgroups/freezer-subsystem.txt)
         */
        r = virCgroupSetFreezerState(cgroup, "FROZEN");

        /*
         * Returning EBUSY explicitly indicates that the group is
         * being freezed but incomplete and other errors are true
         * errors.
         */
        if (r < 0 && r != -EBUSY) {
            VIR_DEBUG("Writing freezer.state failed with errno: %d", r);
            goto error;
        }
        if (r == -EBUSY)
            VIR_DEBUG0("Writing freezer.state gets EBUSY");

        /*
         * Unfortunately, returning 0 (success) is likely to happen
         * even when the freezing has not been completed. Sometimes
         * the state of the group remains "FREEZING" like when
         * returning -EBUSY and even worse may never transit to
         * "FROZEN" even if writing "FROZEN" again.
         *
         * So we don't trust the return value anyway and always
         * decide that the freezing has been complete only with
         * the state actually transit to "FROZEN".
         */
        usleep(check_interval * 1000);

        r = virCgroupGetFreezerState(cgroup, &state);

        if (r < 0) {
            VIR_DEBUG("Reading freezer.state failed with errno: %d", r);
            goto error;
        }
        VIR_DEBUG("Read freezer.state: %s", state);

        if (STREQ(state, "FROZEN")) {
            ret = 0;
            goto cleanup;
        }

        waited_time += check_interval;
        /*
         * Increasing check_interval exponentially starting with
         * small initial value treats nicely two cases; One is
         * a container is under no load and waiting for long period
         * makes no sense. The other is under heavy load. The container
         * may stay longer time in FREEZING or never transit to FROZEN.
         * In that case, eager polling will just waste CPU time.
         */
        check_interval *= exp;
        VIR_FREE(state);
    }
    VIR_DEBUG0("lxcFreezeContainer timeout");
error:
    /*
     * If timeout or an error on reading the state occurs,
     * activate the group again and return an error.
     * This is likely to fall the group back again gracefully.
     */
    virCgroupSetFreezerState(cgroup, "THAWED");
    ret = -1;

cleanup:
    if (cgroup)
        virCgroupFree(&cgroup);
    VIR_FREE(state);
    return ret;
}

static int lxcDomainSuspend(virDomainPtr dom)
{
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    virDomainEventPtr event = NULL;
    int ret = -1;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
2271
        lxcError(VIR_ERR_NO_DOMAIN,
2272
                 _("No domain with matching uuid '%s'"), uuidstr);
R
Ryota Ozaki 已提交
2273 2274 2275
        goto cleanup;
    }

D
Daniel P. Berrange 已提交
2276
    if (!virDomainObjIsActive(vm)) {
2277
        lxcError(VIR_ERR_OPERATION_INVALID,
2278
                 "%s", _("Domain is not running"));
R
Ryota Ozaki 已提交
2279 2280 2281 2282 2283
        goto cleanup;
    }

    if (vm->state != VIR_DOMAIN_PAUSED) {
        if (lxcFreezeContainer(driver, vm) < 0) {
2284
            lxcError(VIR_ERR_OPERATION_FAILED,
2285
                     "%s", _("Suspend operation failed"));
R
Ryota Ozaki 已提交
2286 2287 2288 2289 2290 2291 2292 2293 2294
            goto cleanup;
        }
        vm->state = VIR_DOMAIN_PAUSED;

        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_SUSPENDED,
                                         VIR_DOMAIN_EVENT_SUSPENDED_PAUSED);
    }

2295
    if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
R
Ryota Ozaki 已提交
2296 2297 2298 2299 2300 2301 2302 2303 2304 2305 2306 2307 2308 2309 2310 2311 2312 2313 2314 2315 2316 2317 2318 2319 2320 2321 2322 2323 2324 2325 2326 2327 2328 2329 2330 2331 2332 2333 2334 2335
        goto cleanup;
    ret = 0;

cleanup:
    if (event)
        lxcDomainEventQueue(driver, event);
    if (vm)
        virDomainObjUnlock(vm);
    lxcDriverUnlock(driver);
    return ret;
}

static int lxcUnfreezeContainer(lxc_driver_t *driver, virDomainObjPtr vm)
{
    int ret;
    virCgroupPtr cgroup = NULL;

    if (!(driver->cgroup &&
        virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) == 0))
        return -1;

    ret = virCgroupSetFreezerState(cgroup, "THAWED");

    virCgroupFree(&cgroup);
    return ret;
}

static int lxcDomainResume(virDomainPtr dom)
{
    lxc_driver_t *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    virDomainEventPtr event = NULL;
    int ret = -1;

    lxcDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
2336
        lxcError(VIR_ERR_NO_DOMAIN,
2337
                 _("No domain with matching uuid '%s'"), uuidstr);
R
Ryota Ozaki 已提交
2338 2339 2340
        goto cleanup;
    }

D
Daniel P. Berrange 已提交
2341
    if (!virDomainObjIsActive(vm)) {
2342
        lxcError(VIR_ERR_OPERATION_INVALID,
2343
                 "%s", _("Domain is not running"));
R
Ryota Ozaki 已提交
2344 2345 2346 2347 2348
        goto cleanup;
    }

    if (vm->state == VIR_DOMAIN_PAUSED) {
        if (lxcUnfreezeContainer(driver, vm) < 0) {
2349
            lxcError(VIR_ERR_OPERATION_FAILED,
2350
                     "%s", _("Resume operation failed"));
R
Ryota Ozaki 已提交
2351 2352 2353 2354 2355 2356 2357 2358 2359
            goto cleanup;
        }
        vm->state = VIR_DOMAIN_RUNNING;

        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_RESUMED,
                                         VIR_DOMAIN_EVENT_RESUMED_UNPAUSED);
    }

2360
    if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
R
Ryota Ozaki 已提交
2361 2362 2363 2364 2365 2366 2367 2368 2369 2370 2371 2372 2373
        goto cleanup;
    ret = 0;

cleanup:
    if (event)
        lxcDomainEventQueue(driver, event);
    if (vm)
        virDomainObjUnlock(vm);
    lxcDriverUnlock(driver);
    return ret;
}


D
Daniel Veillard 已提交
2374 2375 2376 2377 2378 2379 2380 2381
/* Function Tables */
static virDriver lxcDriver = {
    VIR_DRV_LXC, /* the number virDrvNo */
    "LXC", /* the name of the driver */
    lxcOpen, /* open */
    lxcClose, /* close */
    NULL, /* supports_feature */
    NULL, /* type */
D
Dan Smith 已提交
2382
    lxcVersion, /* version */
2383
    NULL, /* libvirtVersion (impl. in libvirt.c) */
2384
    virGetHostname, /* getHostname */
D
Daniel Veillard 已提交
2385
    NULL, /* getMaxVcpus */
2386 2387
    nodeGetInfo, /* nodeGetInfo */
    lxcGetCapabilities, /* getCapabilities */
D
Daniel Veillard 已提交
2388 2389
    lxcListDomains, /* listDomains */
    lxcNumDomains, /* numOfDomains */
2390
    lxcDomainCreateAndStart, /* domainCreateXML */
D
Daniel Veillard 已提交
2391 2392 2393
    lxcDomainLookupByID, /* domainLookupByID */
    lxcDomainLookupByUUID, /* domainLookupByUUID */
    lxcDomainLookupByName, /* domainLookupByName */
R
Ryota Ozaki 已提交
2394 2395
    lxcDomainSuspend, /* domainSuspend */
    lxcDomainResume, /* domainResume */
2396
    lxcDomainShutdown, /* domainShutdown */
D
Daniel Veillard 已提交
2397
    NULL, /* domainReboot */
2398
    lxcDomainDestroy, /* domainDestroy */
D
Daniel Veillard 已提交
2399
    lxcGetOSType, /* domainGetOSType */
R
Ryota Ozaki 已提交
2400 2401 2402
    lxcDomainGetMaxMemory, /* domainGetMaxMemory */
    lxcDomainSetMaxMemory, /* domainSetMaxMemory */
    lxcDomainSetMemory, /* domainSetMemory */
D
Daniel Veillard 已提交
2403 2404 2405 2406 2407 2408 2409 2410
    lxcDomainGetInfo, /* domainGetInfo */
    NULL, /* domainSave */
    NULL, /* domainRestore */
    NULL, /* domainCoreDump */
    NULL, /* domainSetVcpus */
    NULL, /* domainPinVcpu */
    NULL, /* domainGetVcpus */
    NULL, /* domainGetMaxVcpus */
2411 2412
    NULL, /* domainGetSecurityLabel */
    NULL, /* nodeGetSecurityModel */
D
Daniel Veillard 已提交
2413
    lxcDomainDumpXML, /* domainDumpXML */
2414 2415
    NULL, /* domainXMLFromNative */
    NULL, /* domainXMLToNative */
D
Daniel Veillard 已提交
2416 2417
    lxcListDefinedDomains, /* listDefinedDomains */
    lxcNumDefinedDomains, /* numOfDefinedDomains */
2418
    lxcDomainStart, /* domainCreate */
D
Daniel Veillard 已提交
2419 2420 2421
    lxcDomainDefine, /* domainDefineXML */
    lxcDomainUndefine, /* domainUndefine */
    NULL, /* domainAttachDevice */
2422
    NULL, /* domainAttachDeviceFlags */
D
Daniel Veillard 已提交
2423
    NULL, /* domainDetachDevice */
2424
    NULL, /* domainDetachDeviceFlags */
2425 2426
    lxcDomainGetAutostart, /* domainGetAutostart */
    lxcDomainSetAutostart, /* domainSetAutostart */
2427 2428 2429
    lxcGetSchedulerType, /* domainGetSchedulerType */
    lxcGetSchedulerParameters, /* domainGetSchedulerParameters */
    lxcSetSchedulerParameters, /* domainSetSchedulerParameters */
D
Daniel Veillard 已提交
2430 2431 2432 2433
    NULL, /* domainMigratePrepare */
    NULL, /* domainMigratePerform */
    NULL, /* domainMigrateFinish */
    NULL, /* domainBlockStats */
2434
    lxcDomainInterfaceStats, /* domainInterfaceStats */
2435
    NULL, /* domainMemoryStats */
D
Daniel P. Berrange 已提交
2436 2437
    NULL, /* domainBlockPeek */
    NULL, /* domainMemoryPeek */
2438 2439
    nodeGetCellsFreeMemory, /* nodeGetCellsFreeMemory */
    nodeGetFreeMemory,  /* getFreeMemory */
2440 2441
    lxcDomainEventRegister, /* domainEventRegister */
    lxcDomainEventDeregister, /* domainEventDeregister */
D
Daniel Veillard 已提交
2442 2443
    NULL, /* domainMigratePrepare2 */
    NULL, /* domainMigrateFinish2 */
2444
    NULL, /* nodeDeviceDettach */
2445 2446
    NULL, /* nodeDeviceReAttach */
    NULL, /* nodeDeviceReset */
C
Chris Lalancette 已提交
2447
    NULL, /* domainMigratePrepareTunnel */
2448 2449 2450 2451
    lxcIsEncrypted,
    lxcIsSecure,
    lxcDomainIsActive,
    lxcDomainIsPersistent,
J
Jiri Denemark 已提交
2452
    NULL, /* cpuCompare */
2453
    NULL, /* cpuBaseline */
D
Daniel Veillard 已提交
2454 2455
};

2456
static virStateDriver lxcStateDriver = {
2457
    .name = "LXC",
2458 2459 2460
    .initialize = lxcStartup,
    .cleanup = lxcShutdown,
    .active = lxcActive,
2461
    .reload = lxcReload,
2462 2463
};

D
Daniel Veillard 已提交
2464 2465 2466
int lxcRegister(void)
{
    virRegisterDriver(&lxcDriver);
2467
    virRegisterStateDriver(&lxcStateDriver);
D
Daniel Veillard 已提交
2468 2469
    return 0;
}