Queue.java 33.5 KB
Newer Older
K
kohsuke 已提交
1 2
package hudson.model;

3
import hudson.Util;
K
kohsuke 已提交
4
import hudson.XmlFile;
5
import hudson.BulkChange;
K
kohsuke 已提交
6
import hudson.model.Node.Mode;
7 8
import hudson.triggers.SafeTimerTask;
import hudson.triggers.Trigger;
K
kohsuke 已提交
9
import hudson.util.OneShotEvent;
K
kohsuke 已提交
10
import hudson.util.XStream2;
11
import hudson.util.TimeUnit2;
K
kohsuke 已提交
12

13 14 15 16 17
import java.io.BufferedReader;
import java.io.File;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStreamReader;
18
import java.lang.ref.WeakReference;
K
kohsuke 已提交
19 20 21 22 23 24 25 26 27 28
import java.util.ArrayList;
import java.util.Calendar;
import java.util.GregorianCalendar;
import java.util.HashMap;
import java.util.Iterator;
import java.util.LinkedHashMap;
import java.util.List;
import java.util.Map;
import java.util.Set;
import java.util.TreeSet;
29
import java.util.NoSuchElementException;
30
import java.util.concurrent.TimeUnit;
S
stephenconnolly 已提交
31
import java.util.Map.Entry;
K
kohsuke 已提交
32 33 34
import java.util.logging.Level;
import java.util.logging.Logger;

K
kohsuke 已提交
35 36 37 38 39 40 41 42 43
import javax.management.timer.Timer;

import org.acegisecurity.AccessDeniedException;
import org.kohsuke.stapler.export.Exported;
import org.kohsuke.stapler.export.ExportedBean;

import com.thoughtworks.xstream.XStream;
import com.thoughtworks.xstream.converters.basic.AbstractSingleValueConverter;

K
kohsuke 已提交
44 45
/**
 * Build queue.
46 47
 *
 * <p>
48 49
 * This class implements the core scheduling logic. {@link Task} represents the executable
 * tasks that are placed in the queue. While in the queue, a task is wrapped into an {@link Item}
50
 * so that we can keep track of additional data used for deciding what to execute when.
51 52
 *
 * <p>
53 54 55 56 57 58 59 60
 * Items in the queue go through several stages, as depicted below:
 * <pre>
 * (enter) --> waitingList --+--> blockedProjects
 *                           |        ^
 *                           |        |
 *                           |        v
 *                           +--> buildables ---> (executed)
 * </pre>
61 62
 *
 * <p>
63 64 65
 * In addition, at any stage, an item can be removed from the queue (for example, when the user
 * cancels a job in the queue.) See the corresponding field for their exact meanings.
 *
K
kohsuke 已提交
66 67
 * @author Kohsuke Kawaguchi
 */
68
@ExportedBean
69
public class Queue extends ResourceController implements Saveable {
K
kohsuke 已提交
70
    /**
71
     * Items that are waiting for its quiet period to pass.
72 73
     *
     * <p>
K
kohsuke 已提交
74 75 76
     * This consists of {@link Item}s that cannot be run yet
     * because its time has not yet come.
     */
77
    private final Set<WaitingItem> waitingList = new TreeSet<WaitingItem>();
K
kohsuke 已提交
78 79 80

    /**
     * {@link Project}s that can be built immediately
81 82 83
     * but blocked because another build is in progress,
     * required {@link Resource}s are not available, or otherwise blocked
     * by {@link Task#isBuildBlocked()}.
84 85
     *
     * <p>
86 87
     * Conceptually a set of {@link BlockedItem}, but we often need to look up
     * {@link BlockedItem} from {@link Task}, so organized as a map.
K
kohsuke 已提交
88
     */
89
    private final Map<Task,BlockedItem> blockedProjects = new HashMap<Task,BlockedItem>();
K
kohsuke 已提交
90 91 92 93

    /**
     * {@link Project}s that can be built immediately
     * that are waiting for available {@link Executor}.
94 95
     *
     * <p>
96 97 98
     * Conceptually, this is a list of {@link BuildableItem} (FIFO list, not a set, so that
     * the item doesn't starve in the queue), but we often need to look up
     * {@link BuildableItem} from {@link Task}, so organized as a {@link LinkedHashMap}.
K
kohsuke 已提交
99
     */
100
    private final LinkedHashMap<Task,BuildableItem> buildables = new LinkedHashMap<Task,BuildableItem>();
101

K
kohsuke 已提交
102 103 104
    /**
     * Data structure created for each idle {@link Executor}.
     * This is an offer from the queue to an executor.
105 106
     *
     * <p>
107
     * It eventually receives a {@link #item} to build.
K
kohsuke 已提交
108 109 110 111 112 113 114 115 116 117 118 119 120
     */
    private static class JobOffer {
        final Executor executor;

        /**
         * Used to wake up an executor, when it has an offered
         * {@link Project} to build.
         */
        final OneShotEvent event = new OneShotEvent();
        /**
         * The project that this {@link Executor} is going to build.
         * (Or null, in which case event is used to trigger a queue maintenance.)
         */
121
        BuildableItem item;
K
kohsuke 已提交
122 123 124 125 126

        public JobOffer(Executor executor) {
            this.executor = executor;
        }

127 128 129
        public void set(BuildableItem p) {
            assert this.item == null;
            this.item = p;
K
kohsuke 已提交
130 131 132 133
            event.signal();
        }

        public boolean isAvailable() {
134
            return item == null && !executor.getOwner().isOffline() && executor.getOwner().isAcceptingTasks();
K
kohsuke 已提交
135 136 137 138 139 140 141
        }

        public Node getNode() {
            return executor.getOwner().getNode();
        }

        public boolean isNotExclusive() {
142
            return getNode().getMode() == Mode.NORMAL;
K
kohsuke 已提交
143 144 145
        }
    }

S
stephenconnolly 已提交
146 147 148
    /**
     * The executors that are currently parked while waiting for a job to run.
     */
149
    private final Map<Executor, JobOffer> parked = new HashMap<Executor, JobOffer>();
K
kohsuke 已提交
150

151 152 153 154 155 156
    /**
     * Creates the queue and instantiates a {@code MaintainTask} for it.
     */
    public Queue() {
        // if all the executors are busy doing something, then the queue won't be maintained in
        // timely fashion, so use another thread to make sure it happens.
        new MaintainTask(this);
    }

K
kohsuke 已提交
157 158 159 160 161
    /**
     * Loads the queue contents that was {@link #save() saved}.
     */
    public synchronized void load() {
        try {
K
TAB->WS  
kohsuke 已提交
162
            // first try the old format
K
kohsuke 已提交
163
            File queueFile = getQueueFile();
K
kohsuke 已提交
164 165
            if (queueFile.exists()) {
                BufferedReader in = new BufferedReader(new InputStreamReader(new FileInputStream(queueFile)));
K
TAB->WS  
kohsuke 已提交
166 167 168 169 170 171 172 173 174 175 176 177
                String line;
                while ((line = in.readLine()) != null) {
                    AbstractProject j = Hudson.getInstance().getItemByFullName(line, AbstractProject.class);
                    if (j != null)
                        j.scheduleBuild();
                }
                in.close();
                // discard the queue file now that we are done
                queueFile.delete();
            } else {
                queueFile = getXMLQueueFile();
                if (queueFile.exists()) {
178
                    List<Task> tasks = (List<Task>) new XmlFile(XSTREAM, queueFile).read();
K
TAB->WS  
kohsuke 已提交
179 180 181
                    for (Task task : tasks) {
                        add(task, 0);
                    }
182 183 184 185 186 187 188 189 190

                    // I just had an incident where all the executors are dead at AbstractProject._getRuns()
                    // because runs is null. Debugger revealed that this is caused by a MatrixConfiguration
                    // object that doesn't appear to be de-serialized properly.
                    // I don't know how this problem happened, but to diagnose this problem better
                    // when it happens again, save the old queue file for introspection.
                    File bk = new File(queueFile.getPath() + ".bak");
                    bk.delete();
                    queueFile.renameTo(bk);
K
TAB->WS  
kohsuke 已提交
191 192 193
                    queueFile.delete();
                }
            }
194 195
        } catch (IOException e) {
            LOGGER.log(Level.WARNING, "Failed to load the queue file " + getQueueFile(), e);
K
kohsuke 已提交
196 197 198 199 200 201 202
        }
    }

    /**
     * Persists the queue contents to the disk.
     */
    public synchronized void save() {
203 204
        if(BulkChange.contains(this))  return;
        
K
kohsuke 已提交
205 206 207
        // write out the tasks on the queue
    	ArrayList<Task> tasks = new ArrayList<Task>();
    	for (Item item: getItems()) {
K
TAB->WS  
kohsuke 已提交
208
    	    tasks.add(item.task);
K
kohsuke 已提交
209 210
    	}
    	
K
kohsuke 已提交
211
        try {
212
            new XmlFile(XSTREAM, getXMLQueueFile()).write(tasks);
213 214
        } catch (IOException e) {
            LOGGER.log(Level.WARNING, "Failed to write out the queue file " + getQueueFile(), e);
K
kohsuke 已提交
215 216 217
        }
    }

218 219 220 221 222 223 224 225 226 227
    /**
     * Wipes out all the items currently in the queue, as if all of them are cancelled at once.
     */
    public synchronized void clear() {
        // empty every stage of the queue
        buildables.clear();
        blockedProjects.clear();
        waitingList.clear();

        // the contents changed, so ask for a queue maintenance
        scheduleMaintenance();
    }

K
kohsuke 已提交
228
    private File getQueueFile() {
K
TAB->WS  
kohsuke 已提交
229 230
        return new File(Hudson.getInstance().getRootDir(), "queue.txt");
    }
K
kohsuke 已提交
231

232
    /*package*/ File getXMLQueueFile() {
K
TAB->WS  
kohsuke 已提交
233 234
        return new File(Hudson.getInstance().getRootDir(), "queue.xml");
    }
K
kohsuke 已提交
235 236 237

    /**
     * Schedule a new build for this project.
238
     *
239 240 241
     * @return true if the project is actually added to the queue.
     *         false if the queue contained it and therefore the add()
     *         was noop
K
kohsuke 已提交
242
     */
243 244
    public boolean add(AbstractProject p) {
        return add(p, p.getQuietPeriod());
245 246 247 248
    }

    /**
     * Schedules a new build with a custom quiet period.
249 250
     *
     * <p>
K
kohsuke 已提交
251 252
     * Left for backward compatibility with &lt;1.114.
     *
253 254
     * @since 1.105
     */
255 256
    public synchronized boolean add(AbstractProject p, int quietPeriod) {
        return add((Task) p, quietPeriod);
K
kohsuke 已提交
257 258 259 260 261
    }

    /**
     * Schedules an execution of a task.
     *
262 263 264
     * @param quietPeriod Number of seconds that the task will be placed in queue.
     *                    Useful when the same task is likely scheduled for multiple
     *                    times.
K
kohsuke 已提交
265 266
     * @since 1.114
     */
267 268 269 270
    public synchronized boolean add(Task p, int quietPeriod) {
        Item item = getItem(p);
        Calendar due = new GregorianCalendar();
        due.add(Calendar.SECOND, quietPeriod);
271
        if (item != null) {
272 273 274 275 276 277
            if (!(item instanceof WaitingItem))
                // already in the blocked or buildable stage
                // no need to requeue
                return false;

            WaitingItem wi = (WaitingItem) item;
K
kohsuke 已提交
278

279 280 281
            if(quietPeriod<=0) {
                // the user really wants to build now, and they mean NOW.
                // so let's pull in the timestamp if we can.
282
                if (wi.timestamp.before(due))
283 284 285
                    return false;
            } else {
                // otherwise we do the normal quiet period implementation
286
                if (wi.timestamp.after(due))
287
                    return false;
288
                // quiet period timer reset. start the period over again
289
            }
290 291 292 293 294

            // waitingList is sorted, so when we change a timestamp we need to maintain order
            waitingList.remove(wi);
            wi.timestamp = due;
            waitingList.add(wi);
295 296
        } else {
            LOGGER.fine(p.getName() + " added to queue");
297

298
            // put the item in the queue
299
            waitingList.add(new WaitingItem(due,p));
K
kohsuke 已提交
300

301
        }
K
kohsuke 已提交
302
        scheduleMaintenance();   // let an executor know that a new item is in the queue.
303
        return true;
K
kohsuke 已提交
304 305
    }

K
kohsuke 已提交
306 307 308
    /**
     * Cancels the item in the queue.
     *
309 310
     * @return true if the project was indeed in the queue and was removed.
     *         false if this was no-op.
K
kohsuke 已提交
311
     */
K
kohsuke 已提交
312
    public synchronized boolean cancel(Task p) {
313
        LOGGER.fine("Cancelling " + p.getName());
K
kohsuke 已提交
314 315
        for (Iterator<WaitingItem> itr = waitingList.iterator(); itr.hasNext();) {
            Item item = itr.next();
316
            if (item.task == p) {
K
kohsuke 已提交
317
                itr.remove();
K
kohsuke 已提交
318
                return true;
K
kohsuke 已提交
319 320
            }
        }
K
kohsuke 已提交
321
        // use bitwise-OR to make sure that both branches get evaluated all the time
322
        return blockedProjects.remove(p)!=null | buildables.remove(p)!=null;
K
kohsuke 已提交
323 324 325
    }

    public synchronized boolean isEmpty() {
326
        return waitingList.isEmpty() && blockedProjects.isEmpty() && buildables.isEmpty();
K
kohsuke 已提交
327 328
    }

329
    private synchronized WaitingItem peek() {
330
        return waitingList.iterator().next();
K
kohsuke 已提交
331 332 333 334 335
    }

    /**
     * Gets a snapshot of items in the queue.
     */
336
    @Exported(inline=true)
K
kohsuke 已提交
337
    public synchronized Item[] getItems() {
338 339 340
        Item[] r = new Item[waitingList.size() + blockedProjects.size() + buildables.size()];
        waitingList.toArray(r);
        int idx = waitingList.size();
341 342 343 344
        for (BlockedItem p : blockedProjects.values())
            r[idx++] = p;
        for (BuildableItem p : buildables.values())
            r[idx++] = p;
K
kohsuke 已提交
345 346 347
        return r;
    }

348 349 350 351
    public synchronized List<BuildableItem> getBuildableItems(Computer c) {
        List<BuildableItem> result = new ArrayList<BuildableItem>();
        for (BuildableItem p : buildables.values()) {
            Label l = p.task.getAssignedLabel();
352 353 354 355 356
            if (l != null) {
                // if a project has assigned label, it can be only built on it
                if (!l.contains(c.getNode()))
                    continue;
            }
357
            result.add(p);
358
        }
359
        return result;
360 361
    }

K
kohsuke 已提交
362 363 364 365 366
    /**
     * Gets the information about the queue item for the given project.
     *
     * @return null if the project is not in the queue.
     */
367 368
    public synchronized Item getItem(Task t) {
        BlockedItem bp = blockedProjects.get(t);
369
        if (bp!=null)
370 371
            return bp;
        BuildableItem bi = buildables.get(t);
372
        if(bi!=null)
373 374
            return bi;

375
        for (Item item : waitingList) {
376
            if (item.task == t)
K
kohsuke 已提交
377 378 379 380 381
                return item;
        }
        return null;
    }

382 383
    /**
     * Left for backward compatibility.
384
     *
385 386
     * @see #getItem(Task)
    public synchronized Item getItem(AbstractProject p) {
387
        return getItem((Task) p);
388
    }
K
kohsuke 已提交
389
     */
390

K
kohsuke 已提交
391
    /**
K
kohsuke 已提交
392
     * Returns true if this queue contains the said project.
K
kohsuke 已提交
393
     */
394 395
    public synchronized boolean contains(Task t) {
        if (blockedProjects.containsKey(t) || buildables.containsKey(t))
K
kohsuke 已提交
396
            return true;
397
        for (Item item : waitingList) {
398
            if (item.task == t)
K
kohsuke 已提交
399 400 401 402 403 404 405
                return true;
        }
        return false;
    }

    /**
     * Called by the executor to fetch something to build next.
406
     * <p>
K
kohsuke 已提交
407 408
     * This method blocks until a next project becomes buildable.
     */
409
    public Task pop() throws InterruptedException {
K
kohsuke 已提交
410
        final Executor exec = Executor.currentExecutor();
411

K
kohsuke 已提交
412
        try {
413
            while (true) {
K
kohsuke 已提交
414 415 416
                final JobOffer offer = new JobOffer(exec);
                long sleep = -1;

417
                synchronized (this) {
K
kohsuke 已提交
418 419
                    // consider myself parked
                    assert !parked.containsKey(exec);
420
                    parked.put(exec, offer);
K
kohsuke 已提交
421

K
kohsuke 已提交
422
                    // reuse executor thread to do a queue maintenance.
K
kohsuke 已提交
423 424 425 426 427
                    // at the end of this we get all the buildable jobs
                    // in the buildables field.
                    maintain();

                    // allocate buildable jobs to executors
428
                    Iterator<BuildableItem> itr = buildables.values().iterator();
429
                    while (itr.hasNext()) {
430
                        BuildableItem p = itr.next();
431 432

                        // one last check to make sure this build is not blocked.
433
                        if (isBuildBlocked(p.task)) {
434
                            itr.remove();
435
                            blockedProjects.put(p.task,new BlockedItem(p));
436 437
                            continue;
                        }
438

439
                        JobOffer runner = choose(p.task);
440
                        if (runner == null)
K
kohsuke 已提交
441 442 443 444 445 446 447 448 449 450 451 452 453 454 455
                            // if we couldn't find the executor that fits,
                            // just leave it in the buildables list and
                            // check if we can execute other projects
                            continue;

                        // found a matching executor. use it.
                        runner.set(p);
                        itr.remove();
                    }

                    // we went over all the buildable projects and awaken
                    // all the executors that got work to do. now, go to sleep
                    // until this thread is awakened. If this executor assigned a job to
                    // itself above, the block method will return immediately.

456
                    if (!waitingList.isEmpty()) {
K
kohsuke 已提交
457
                        // wait until the first item in the queue is due
458 459
                        sleep = peek().timestamp.getTimeInMillis() - new GregorianCalendar().getTimeInMillis();
                        if (sleep < 100) sleep = 100;    // avoid wait(0)
K
kohsuke 已提交
460 461 462 463 464
                    }
                }

                // this needs to be done outside synchronized block,
                // so that executors can maintain a queue while others are sleeping
465
                if (sleep == -1)
K
kohsuke 已提交
466 467 468 469
                    offer.event.block();
                else
                    offer.event.block(sleep);

470
                synchronized (this) {
471
                    // retract the offer object
472
                    assert parked.get(exec) == offer;
473 474
                    parked.remove(exec);

K
kohsuke 已提交
475
                    // am I woken up because I have a project to build?
476 477
                    if (offer.item != null) {
                        LOGGER.fine("Pop returning " + offer.item + " for " + exec.getName());
K
kohsuke 已提交
478
                        // if so, just build it
479
                        return offer.item.task;
K
kohsuke 已提交
480 481 482 483 484
                    }
                    // otherwise run a queue maintenance
                }
            }
        } finally {
485
            synchronized (this) {
K
kohsuke 已提交
486
                // remove myself from the parked list
487
                JobOffer offer = parked.remove(exec);
488
                if (offer != null && offer.item != null) {
489 490 491 492 493
                    // we are already assigned a project,
                    // ask for someone else to build it.
                    // note that while this thread is waiting for CPU
                    // someone else can schedule this build again,
                    // so check the contains method first.
494
                    if (!contains(offer.item.task))
495
                        buildables.put(offer.item.task,offer.item);
K
kohsuke 已提交
496
                }
497 498 499 500 501 502

                // since this executor might have been chosen for
                // maintenance, schedule another one. Worst case
                // we'll just run a pointless maintenance, and that's
                // fine.
                scheduleMaintenance();
K
kohsuke 已提交
503 504 505 506 507
            }
        }
    }

    /**
K
kohsuke 已提交
508
     * Chooses the executor to carry out the build for the given project.
K
kohsuke 已提交
509
     *
510
     * @return null if no {@link Executor} can run it.
K
kohsuke 已提交
511
     */
512
    private JobOffer choose(Task p) {
513
        if (Hudson.getInstance().isQuietingDown()) {
K
kohsuke 已提交
514 515 516 517 518
            // if we are quieting down, don't run anything so that
            // all executors will be free.
            return null;
        }

519
        Label l = p.getAssignedLabel();
520
        if (l != null) {
521
            // if a project has assigned label, it can be only built on it
K
kohsuke 已提交
522
            for (JobOffer offer : parked.values()) {
523
                if (offer.isAvailable() && l.contains(offer.getNode()))
K
kohsuke 已提交
524 525 526 527 528
                    return offer;
            }
            return null;
        }

529
        // if we are a large deployment, then we will favor slaves
530
        boolean isLargeHudson = Hudson.getInstance().getSlaves().size() > 10;
531

532
        // otherwise let's see if the last node where this project was built is available
K
kohsuke 已提交
533 534
        // it has up-to-date workspace, so that's usually preferable.
        // (but we can't use an exclusive node)
535
        Node n = p.getLastBuiltOn();
536
        if (n != null && n.getMode() == Mode.NORMAL) {
K
kohsuke 已提交
537
            for (JobOffer offer : parked.values()) {
538 539
                if (offer.isAvailable() && offer.getNode() == n) {
                    if (isLargeHudson && offer.getNode() instanceof Slave)
S
stephenconnolly 已提交
540
                        // but if we are a large Hudson, then we really do want to keep the master free from builds
541
                        continue;
K
kohsuke 已提交
542
                    return offer;
543
                }
K
kohsuke 已提交
544 545 546 547 548 549
            }
        }

        // duration of a build on a slave tends not to have an impact on
        // the master/slave communication, so that means we should favor
        // running long jobs on slaves.
550 551
        // Similarly if we have many slaves, master should be made available
        // for HTTP requests and coordination as much as possible
552
        if (isLargeHudson || p.getEstimatedDuration() > 15 * 60 * 1000) {
K
kohsuke 已提交
553 554
            // consider a long job to be > 15 mins
            for (JobOffer offer : parked.values()) {
555
                if (offer.isAvailable() && offer.getNode() instanceof Slave && offer.isNotExclusive())
K
kohsuke 已提交
556 557 558 559 560 561
                    return offer;
            }
        }

        // lastly, just look for any idle executor
        for (JobOffer offer : parked.values()) {
562
            if (offer.isAvailable() && offer.isNotExclusive())
K
kohsuke 已提交
563 564 565 566 567 568 569 570 571
                return offer;
        }

        // nothing available
        return null;
    }

    /**
     * Checks the queue and runs anything that can be run.
572 573
     *
     * <p>
K
kohsuke 已提交
574
     * When conditions are changed, this method should be invoked.
575
     * <p>
K
kohsuke 已提交
576 577 578 579 580 581 582
     * This wakes up one {@link Executor} so that it will maintain a queue.
     */
    public synchronized void scheduleMaintenance() {
        // this code assumes that after this method is called
        // no more executors will be offered job except by
        // the pop() code.
        for (Entry<Executor, JobOffer> av : parked.entrySet()) {
583
            if (av.getValue().item == null) {
K
kohsuke 已提交
584 585 586 587 588 589
                av.getValue().event.signal();
                return;
            }
        }
    }

590 591 592
    /**
     * Checks if the given task is blocked.
     */
593
    private boolean isBuildBlocked(Task t) {
594 595 596
        return t.isBuildBlocked() || !canRun(t.getResourceList());
    }

K
kohsuke 已提交
597 598

    /**
K
kohsuke 已提交
599
     * Queue maintenance.
600
     * <p>
601
     * Move projects between {@link #waitingList}, {@link #blockedProjects}, and {@link #buildables}
K
kohsuke 已提交
602 603
     * appropriately.
     */
604
    public synchronized void maintain() {
605 606
        if (LOGGER.isLoggable(Level.FINE))
            LOGGER.fine("Queue maintenance started " + this);
607

608
        Iterator<BlockedItem> itr = blockedProjects.values().iterator();
609
        while (itr.hasNext()) {
610 611
            BlockedItem p = itr.next();
            if (!isBuildBlocked(p.task)) {
K
kohsuke 已提交
612
                // ready to be executed
613
                LOGGER.fine(p.task.getName() + " no longer blocked");
K
kohsuke 已提交
614
                itr.remove();
615
                buildables.put(p.task,new BuildableItem(p));
K
kohsuke 已提交
616 617 618
            }
        }

619
        while (!waitingList.isEmpty()) {
620
            WaitingItem top = peek();
K
kohsuke 已提交
621

622
            if (!top.timestamp.before(new GregorianCalendar()))
K
kohsuke 已提交
623 624
                return; // finished moving all ready items from queue

625
            Task p = top.task;
626
            if (!isBuildBlocked(p)) {
K
kohsuke 已提交
627
                // ready to be executed immediately
628
                waitingList.remove(top);
629
                LOGGER.fine(p.getName() + " ready to build");
630
                buildables.put(p,new BuildableItem(top));
K
kohsuke 已提交
631
            } else {
632
                // this can't be built now because another build is in progress
K
kohsuke 已提交
633
                // set this project aside.
634
                waitingList.remove(top);
635
                LOGGER.fine(p.getName() + " is blocked");
636
                blockedProjects.put(p,new BlockedItem(top));
K
kohsuke 已提交
637 638 639 640
            }
        }
    }

641 642 643 644
    /**
     * Returns a new {@link Api} object created for this queue.
     */
    public Api getApi() {
        return new Api(this);
    }

K
kohsuke 已提交
645 646
    /**
     * Task whose execution is controlled by the queue.
647
     *
648
     * <p>
K
kohsuke 已提交
649 650 651
     * {@link #equals(Object) Value equality} of {@link Task}s is used
     * to collapse two tasks into one. This is used to avoid infinite
     * queue backlog.
652 653 654 655
     *
     * <p>
     * Pending {@link Task}s are persisted when Hudson shuts down, so
     * it needs to be persistable.
K
kohsuke 已提交
656
     */
657
    public interface Task extends ModelObject, ResourceActivity {
658
        /**
659 660 661
         * If this task needs to be run on a node with a particular label,
         * return that {@link Label}. Otherwise null, indicating
         * it can run on anywhere.
662
         */
663
        Label getAssignedLabel();
664 665 666 667 668 669 670 671 672 673 674

        /**
         * If the previous execution of this task run on a certain node
         * and this task prefers to run on the same node, return that.
         * Otherwise null.
         */
        Node getLastBuiltOn();

        /**
         * Returns true if the execution should be blocked
         * for temporary reasons.
675 676
         *
         * <p>
K
kohsuke 已提交
677 678
         * This can be used to define mutual exclusion that goes beyond
         * {@link #getResourceList()}.
679 680 681 682 683 684 685 686 687 688 689
         */
        boolean isBuildBlocked();

        /**
         * When {@link #isBuildBlocked()} is true, this method returns
         * human readable description of why the build is blocked.
         * Used for HTML rendering.
         */
        String getWhyBlocked();

        /**
K
kohsuke 已提交
690
         * Unique name of this task.
K
kohsuke 已提交
691
         *
692 693
         * @see hudson.model.Item#getName()
         *      TODO: this doesn't make sense anymore. remove it.
694 695 696
         */
        String getName();

697 698 699 700 701
        /**
         * @see hudson.model.Item#getFullDisplayName()
         */
        String getFullDisplayName();

702 703 704 705
        /**
         * Estimate of how long will it take to execute this task.
         * Measured in milliseconds.
         *
706
         * @return -1 if it's impossible to estimate.
707 708 709
         */
        long getEstimatedDuration();

K
kohsuke 已提交
710
        /**
711
         * Creates {@link Executable}, which performs the actual execution of the task.
K
kohsuke 已提交
712
         */
713
        Executable createExecutable() throws IOException;
714 715 716 717 718 719 720 721

        /**
         * Checks the permission to see if the current user can abort this executable.
         * Returns normally from this method if it's OK.
         *
         * @throws AccessDeniedException if the permission is not granted.
         */
        void checkAbortPermission();
K
kohsuke 已提交
722 723 724 725 726 727

        /**
         * Works just like {@link #checkAbortPermission()} except it indicates the status by a return value,
         * instead of exception.
         */
        boolean hasAbortPermission();
728 729 730 731 732
    }

    public interface Executable extends Runnable {
        /**
         * Task from which this executable was created.
K
kohsuke 已提交
733
         * Never null.
734 735 736 737 738 739 740
         */
        Task getParent();

        /**
         * Called by {@link Executor} to perform the task
         */
        void run();
741 742
    }

K
kohsuke 已提交
743 744 745
    /**
     * Item in a queue.
     */
746
    @ExportedBean(defaultVisibility = 999)
747
    public abstract class Item {
K
kohsuke 已提交
748 749 750
        /**
         * Project to be built.
         */
751
        @Exported
752
        public final Task task;
K
kohsuke 已提交
753

754
        /**
755 756 757
         * Build is blocked because another build is in progress,
         * required {@link Resource}s are not available, or otherwise blocked
         * by {@link Task#isBuildBlocked()}.
758
         */
K
kohsuke 已提交
759
        @Exported
760
        public boolean isBlocked() { return this instanceof BlockedItem; }
761 762 763 764 765 766

        /**
         * Build is waiting the executor to become available.
         * This flag is only used in {@link Queue#getItems()} for
         * 'pseudo' items that are actually not really in the queue.
         */
K
kohsuke 已提交
767
        @Exported
768
        public boolean isBuildable() { return this instanceof BuildableItem; }
769

770 771 772 773 774 775
        /**
         * True if the item is starving for an executor for too long.
         */
        @Exported
        public boolean isStuck() { return false; }

776
        protected Item(Task project) {
777
            this.task = project;
K
kohsuke 已提交
778 779
        }

780 781 782
        /**
         * Gets a human-readable status message describing why it's in the queu.
         */
K
kohsuke 已提交
783
        @Exported
784
        public abstract String getWhy();
K
kohsuke 已提交
785

786 787 788 789
        public boolean hasCancelPermission() {
            return task.hasAbortPermission();
        }
    }
790

791 792 793 794 795 796 797 798 799
    /**
     * {@link Item} in the {@link Queue#waitingList} stage.
     */
    public final class WaitingItem extends Item implements Comparable<WaitingItem> {
        /**
         * This item can be run after this time.
         */
        @Exported
        public Calendar timestamp;
800

K
kohsuke 已提交
801 802 803 804 805 806
        /**
         * Unique number of this {@link WaitingItem}.
         * Used to differentiate {@link WaitingItem}s with the same due date, to make it sortable.
         */
        public final int id;

807 808 809
        WaitingItem(Calendar timestamp, Task project) {
            super(project);
            this.timestamp = timestamp;
K
kohsuke 已提交
810 811 812
            synchronized (Queue.this) {
                this.id = iota++;
            }
813 814 815 816 817 818 819 820 821 822 823
        }

        public int compareTo(WaitingItem that) {
            int r = this.timestamp.getTime().compareTo(that.timestamp.getTime());
            if (r != 0) return r;

            return this.id - that.id;
        }

        @Override
        public String getWhy() {
824
            long diff = timestamp.getTimeInMillis() - System.currentTimeMillis();
825
            if (diff > 0)
K
i18n  
kohsuke 已提交
826
                return Messages.Queue_InQuietPeriod(Util.getTimeSpanString(diff));
827 828 829 830
            else
                return Messages.Queue_Unknown();
        }
    }
K
kohsuke 已提交
831

832 833 834 835 836 837 838 839 840 841 842 843 844
    /**
     * Common part between {@link BlockedItem} and {@link BuildableItem}.
     */
    public abstract class NotWaitingItem extends Item {
        /**
         * When did this job exit the {@link Queue#waitingList} phase?
         */
        @Exported
        public final long buildableStartMilliseconds;

        protected NotWaitingItem(WaitingItem wi) {
            super(wi.task);
            buildableStartMilliseconds = System.currentTimeMillis();
K
kohsuke 已提交
845
        }
846

847 848 849
        protected NotWaitingItem(NotWaitingItem ni) {
            super(ni.task);
            buildableStartMilliseconds = ni.buildableStartMilliseconds;
850
        }
851
    }
852

853 854 855 856 857 858 859
    /**
     * {@link Item} in the {@link Queue#blockedProjects} stage.
     */
    public final class BlockedItem extends NotWaitingItem {
        public BlockedItem(WaitingItem wi) {
            super(wi);
        }
860

861 862 863 864 865 866 867 868 869 870 871 872 873
        public BlockedItem(NotWaitingItem ni) {
            super(ni);
        }

        @Override
        public String getWhy() {
            ResourceActivity r = getBlockingActivity(task);
            if (r != null) {
                if (r == task) // blocked by itself, meaning another build is in progress
                    return Messages.Queue_InProgress();
                return Messages.Queue_BlockedBy(r.getDisplayName());
            }
            return task.getWhyBlocked();
874
        }
875
    }
876

877 878 879 880 881 882 883 884 885 886 887 888 889 890
    /**
     * {@link Item} in the {@link Queue#buildables} stage.
     */
    public final class BuildableItem extends NotWaitingItem {
        public BuildableItem(WaitingItem wi) {
            super(wi);
        }

        public BuildableItem(NotWaitingItem ni) {
            super(ni);
        }

        @Override
        public String getWhy() {
891
            Label label = task.getAssignedLabel();
892 893
            Hudson hudson = Hudson.getInstance();
            if (hudson.getSlaves().isEmpty())
894
                label = null;    // no master/slave. pointless to talk about nodes
895 896

            String name = null;
897 898 899 900
            if (label != null) {
                name = label.getName();
                if (label.isOffline()) {
                    if (label.getNodes().size() > 1)
K
i18n  
kohsuke 已提交
901
                        return Messages.Queue_AllNodesOffline(name);
902
                    else
K
i18n  
kohsuke 已提交
903
                        return Messages.Queue_NodeOffline(name);
904 905 906
                }
            }

K
i18n  
kohsuke 已提交
907 908 909 910
            if(name==null)
                return Messages.Queue_WaitingForNextAvailableExecutor();
            else
                return Messages.Queue_WaitingForNextAvailableExecutorOn(name);
911
        }
912 913 914 915 916 917 918 919 920 921 922 923 924 925 926

        @Override
        public boolean isStuck() {
            Label label = task.getAssignedLabel();
            if(label!=null && label.isOffline())
                // no executor online to process this job. definitely stuck.
                return true;

            long d = task.getEstimatedDuration();
            long elapsed = System.currentTimeMillis()-buildableStartMilliseconds;
            if(d>=0) {
                // if we were running elsewhere, we would have done this build twice.
                return elapsed > d*2;
            } else {
                // more than a day in the queue
927
                return TimeUnit2.MILLISECONDS.toHours(elapsed)>24;
928 929
            }
        }
K
kohsuke 已提交
930 931 932 933 934
    }

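    /**
     * Counter that hands out the unique {@link WaitingItem#id} values.
     * It is incremented under the {@link Queue} lock whenever a {@link WaitingItem} is created.
     */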
935
    private int iota = 0;
K
kohsuke 已提交
936 937

    private static final Logger LOGGER = Logger.getLogger(Queue.class.getName());
938

939 940 941 942 943 944 945 946 947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962 963 964 965 966 967 968 969 970 971 972 973 974 975 976 977 978 979 980 981 982 983 984 985 986 987 988 989 990 991 992
    /**
     * This {@link XStream} instance is used to persist {@link Task}s.
     *
     * <p>
     * The converters registered below write {@link hudson.model.Item}s and {@link Run}s
     * as short strings and look the objects up again from {@link Hudson} when reading.
     */
    public static final XStream XSTREAM = new XStream2();

    static {
        // hudson.model.Item <-> its full name
        XSTREAM.registerConverter(new AbstractSingleValueConverter() {

            @Override
            @SuppressWarnings("unchecked")
            public boolean canConvert(Class klazz) {
                return hudson.model.Item.class.isAssignableFrom(klazz);
            }

            /**
             * @throws NoSuchElementException
             *      if no item of the given full name exists.
             */
            @Override
            public Object fromString(String string) {
                Object item = Hudson.getInstance().getItemByFullName(string);
                if(item==null)  throw new NoSuchElementException("No such job exists: "+string);
                return item;
            }

            @Override
            public String toString(Object item) {
                return ((hudson.model.Item) item).getFullName();
            }
        });

        // Run <-> "<full name of the job>#<build number>"
        XSTREAM.registerConverter(new AbstractSingleValueConverter() {

            @SuppressWarnings("unchecked")
            @Override
            public boolean canConvert(Class klazz) {
                return Run.class.isAssignableFrom(klazz);
            }

            /**
             * @throws NoSuchElementException
             *      if the job, or the build of that number in the job, does not exist.
             */
            @Override
            public Object fromString(String string) {
                String[] split = string.split("#");
                String projectName = split[0];
                int buildNumber = Integer.parseInt(split[1]);
                Job<?,?> job = (Job<?,?>) Hudson.getInstance().getItemByFullName(projectName);
                if(job==null)  throw new NoSuchElementException("No such job exists: "+projectName);
                Run<?,?> run = job.getBuildByNumber(buildNumber);
                // check the build that was just looked up, not the job again;
                // otherwise a missing build would be returned as null.
                if(run==null)  throw new NoSuchElementException("No such build: "+string);
                return run;
            }

            @Override
            public String toString(Object object) {
                Run<?,?> run = (Run<?,?>) object;
                return run.getParent().getFullName() + "#" + run.getNumber();
            }
        });
    }

993 994 995 996 997 998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008
    /**
     * Regularly invokes {@link Queue#maintain()} and clean itself up when
     * {@link Queue} gets GC-ed.
     */
    private static class MaintainTask extends SafeTimerTask {
        private final WeakReference<Queue> queue;

        MaintainTask(Queue queue) {
            this.queue = new WeakReference<Queue>(queue);

            long interval = 5 * Timer.ONE_SECOND;
            Trigger.timer.schedule(this, interval, interval);
        }

        protected void doRun() {
            Queue q = queue.get();
1009
            if (q != null)
1010 1011 1012 1013 1014
                q.maintain();
            else
                cancel();
        }
    }
K
kohsuke 已提交
1015
}