SlaveComputer.java 30.8 KB
Newer Older
K
kohsuke 已提交
1 2
/*
 * The MIT License
3
 *
K
kohsuke 已提交
4
 * Copyright (c) 2004-2009, Sun Microsystems, Inc., Kohsuke Kawaguchi, Stephen Connolly
5
 *
K
kohsuke 已提交
6 7 8 9 10 11
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
12
 *
K
kohsuke 已提交
13 14
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
15
 *
K
kohsuke 已提交
16 17 18 19 20 21 22 23
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
24 25
package hudson.slaves;

26 27
import edu.umd.cs.findbugs.annotations.OverrideMustInvoke;
import edu.umd.cs.findbugs.annotations.When;
K
Kohsuke Kawaguchi 已提交
28
import hudson.AbortException;
K
Kohsuke Kawaguchi 已提交
29
import hudson.remoting.ChannelBuilder;
K
Kohsuke Kawaguchi 已提交
30
import hudson.util.IOUtils;
31
import hudson.FilePath;
K
kohsuke 已提交
32
import hudson.Util;
K
Kohsuke Kawaguchi 已提交
33 34 35 36 37 38 39 40 41
import hudson.model.Computer;
import hudson.model.Executor;
import hudson.model.ExecutorListener;
import hudson.model.Node;
import hudson.model.Queue;
import hudson.model.Slave;
import hudson.model.TaskListener;
import hudson.model.User;
import hudson.remoting.Channel;
42
import hudson.remoting.Launcher;
K
Kohsuke Kawaguchi 已提交
43
import hudson.remoting.VirtualChannel;
44
import hudson.security.ACL;
45
import hudson.slaves.OfflineCause.ChannelTermination;
K
Kohsuke Kawaguchi 已提交
46 47 48 49
import hudson.util.Futures;
import hudson.util.NullStream;
import hudson.util.RingBufferLogHandler;
import hudson.util.StreamTaskListener;
50
import hudson.util.io.ReopenableFileOutputStream;
K
Kohsuke Kawaguchi 已提交
51
import hudson.util.io.ReopenableRotatingFileOutputStream;
52
import jenkins.slaves.EncryptedSlaveAgentJnlpFile;
53
import jenkins.slaves.systemInfo.SlaveSystemInfo;
54 55
import org.acegisecurity.context.SecurityContext;
import org.acegisecurity.context.SecurityContextHolder;
56
import org.apache.commons.io.FilenameUtils;
K
Kohsuke Kawaguchi 已提交
57
import org.kohsuke.stapler.WebMethod;
K
Kohsuke Kawaguchi 已提交
58
import org.kohsuke.stapler.interceptor.RequirePOST;
59

K
Kohsuke Kawaguchi 已提交
60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76
import javax.servlet.ServletException;
import java.io.File;
import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;
import java.io.PrintStream;
import java.nio.charset.Charset;
import java.security.Security;
import java.util.ArrayList;
import java.util.Collections;
import java.util.List;
import java.util.concurrent.Future;
import java.util.logging.Handler;
import java.util.logging.Level;
import java.util.logging.LogRecord;
import java.util.logging.Logger;

77 78
import javax.annotation.CheckForNull;
import jenkins.model.Jenkins;
K
Kohsuke Kawaguchi 已提交
79
import static hudson.slaves.SlaveComputer.LogHolder.*;
80
import jenkins.security.ChannelConfigurator;
81
import jenkins.security.MasterToSlaveCallable;
82
import jenkins.slaves.JnlpSlaveAgentProtocol;
83 84
import org.kohsuke.stapler.StaplerRequest;
import org.kohsuke.stapler.StaplerResponse;
85 86 87
import org.kohsuke.stapler.QueryParameter;
import org.kohsuke.stapler.HttpResponse;
import org.kohsuke.stapler.HttpRedirect;
K
Kohsuke Kawaguchi 已提交
88

89

90 91 92 93 94
/**
 * {@link Computer} for {@link Slave}s.
 *
 * @author Kohsuke Kawaguchi
 */
K
kohsuke 已提交
95
public class SlaveComputer extends Computer {
96 97 98 99
    // Remoting channel to the slave agent. Assigned by setChannel() and reset to null by closeChannel().
    private volatile Channel channel;
    // Manual override consulted by isAcceptingTasks(); starts out true and is changed via setAcceptingTasks().
    private volatile transient boolean acceptingTasks = true;
    // Charset name reported by the slave (see DetectDefaultCharset), resolved when the channel is set up.
    private Charset defaultCharset;
    // Result of DetectOS recorded on connect; closeChannel() resets it to null.
    private Boolean isUnix;
K
kohsuke 已提交
100 101 102 103 104 105
    /**
     * Effective {@link ComputerLauncher} that hides the details of
     * how we launch a slave agent on this computer.
     *
     * <p>
     * This is normally the same as {@link Slave#getLauncher()} but
     * can be different. See {@link #grabLauncher(Node)}.
     */
108 109
    private ComputerLauncher launcher;

110 111 112 113 114 115 116 117 118 119 120
    /**
     * Perpetually writable log file.
     * Created in the constructor from {@link #getLogFile()}, rewound at the start of
     * every launch attempt and by {@link #openLogFile()}, and closed in {@link #kill()}.
     */
    private final ReopenableFileOutputStream log;

    /**
     * {@link StreamTaskListener} that wraps {@link #log}, hence perpetually writable.
     * Passed to the launcher and to {@link ComputerListener}s during launch and disconnect.
     */
    private final TaskListener taskListener;


121 122 123 124 125 126 127
    /**
     * Number of failed attempts to reconnect to this node
     * (so that if we keep failing to reconnect, we can stop
     * trying.)
     * Incremented by {@link #tryReconnect()} and reset to 0 once a channel is established.
     */
    private transient int numRetryAttempt;

K
kohsuke 已提交
128 129 130 131 132 133 134 135
    /**
     * Tracks the status of the last launch operation, which is always asynchronous.
     * This can be used to wait for the completion, or cancel the launch activity.
     * Assigned in {@link #_connect(boolean)}.
     */
    private volatile Future<?> lastConnectActivity = null;

    // Marker consulted by setNode(): while it is still null the object is treated as not yet
    // fully constructed, and setNode() skips the retention-strategy check / connect.
    private Object constructed = new Object();

136 137
    // Remote FS root as resolved during setChannel(); cleared by closeChannel(). See getAbsoluteRemoteFs().
    private transient volatile String absoluteRemoteFs;

K
kohsuke 已提交
138 139
    public SlaveComputer(Slave slave) {
        super(slave);
140
        this.log = new ReopenableRotatingFileOutputStream(getLogFile(),10);
141
        this.taskListener = new StreamTaskListener(log);
142
        assert slave.getNumExecutors()!=0 : "Computer created with 0 executors";
K
kohsuke 已提交
143
    }
144 145 146 147 148

    /**
     * {@inheritDoc}
     */
    @Override
149
    @OverrideMustInvoke(When.ANYTIME)
150
    public boolean isAcceptingTasks() {
151 152 153
        // our boolean flag is an override on any additional programmatic reasons why this slave might not be
        // accepting tasks.
        return acceptingTasks && super.isAcceptingTasks();
154 155
    }

K
Kohsuke Kawaguchi 已提交
156 157 158
    /**
     * @since 1.498
     */
159 160 161 162
    public String getJnlpMac() {
        return JnlpSlaveAgentProtocol.SLAVE_SECRET.mac(getName());
    }

163
    /**
     * Suspends or resumes acceptance of tasks by this slave computer. Although a
     * {@linkplain hudson.slaves.ComputerLauncher} or a {@linkplain hudson.slaves.RetentionStrategy} could
     * call this, doing so can make several actors fight over the flag by setting conflicting values.
     * A {@link hudson.slaves.RetentionStrategy} that needs to control availability should instead override
     * {@link hudson.slaves.RetentionStrategy#isAcceptingTasks(hudson.model.Computer)}.
     *
     * @param acceptingTasks {@code true} if the slave can accept tasks.
     */
    public void setAcceptingTasks(boolean acceptingTasks) {
        this.acceptingTasks = acceptingTasks;
    }

    /**
     * Tells whether this computer is a Unix machine rather than a Windows machine.
     *
     * @return
     *      {@code null} while the computer is disconnected, because the platform is unknown then.
     */
    public Boolean isUnix() {
        final Boolean detected = isUnix;
        return detected;
    }

186
    @CheckForNull
187
    @Override
188
    public Slave getNode() {
J
Jesse Glick 已提交
189 190 191 192 193 194 195
        Node node = super.getNode();
        if (node == null || node instanceof Slave) {
            return (Slave)node;
        } else {
            logger.log(Level.WARNING, "found an unexpected kind of node {0} from {1} with nodeName={2}", new Object[] {node, this, nodeName});
            return null;
        }
196 197
    }

K
kohsuke 已提交
198 199 200 201 202 203 204 205
    /**
     * Shows a dedicated icon while the last connect activity is still running,
     * and otherwise defers to the superclass.
     */
    @Override
    public String getIcon() {
        final Future<?> pending = lastConnectActivity;
        final boolean launchInProgress = pending != null && !pending.isDone();
        return launchInProgress ? "computer-flash.gif" : super.getIcon();
    }

M
mindless 已提交
206 207 208 209
    /**
     * @deprecated since 2008-05-20.
     */
    @Deprecated @Override
210 211 212 213 214 215 216 217 218 219 220 221 222
    public boolean isJnlpAgent() {
        return launcher instanceof JNLPLauncher;
    }

    /**
     * Delegates to the effective launcher to decide whether launching is supported.
     */
    @Override
    public boolean isLaunchSupported() {
        final boolean supported = launcher.isLaunchSupported();
        return supported;
    }

    /**
     * Returns the effective launcher obtained through {@link #grabLauncher(Node)}.
     */
    public ComputerLauncher getLauncher() {
        final ComputerLauncher effective = launcher;
        return effective;
    }

223
    protected Future<?> _connect(boolean forceReconnect) {
K
kohsuke 已提交
224
        if(channel!=null)   return Futures.precomputed(null);
225
        if(!forceReconnect && isConnecting())
K
kohsuke 已提交
226
            return lastConnectActivity;
227
        if(forceReconnect && isConnecting())
K
kohsuke 已提交
228
            logger.fine("Forcing a reconnect on "+getName());
229 230

        closeChannel();
K
kohsuke 已提交
231 232
        return lastConnectActivity = Computer.threadPoolForRemoting.submit(new java.util.concurrent.Callable<Object>() {
            public Object call() throws Exception {
233 234
                // do this on another thread so that the lengthy launch operation
                // (which is typical) won't block UI thread.
K
Kohsuke Kawaguchi 已提交
235 236 237

                ACL.impersonate(ACL.SYSTEM);    // background activity should run like a super user

K
kohsuke 已提交
238
                try {
239
                    log.rewind();
240
                    try {
T
Tom Rini 已提交
241
                        for (ComputerListener cl : ComputerListener.all())
242
                            cl.preLaunch(SlaveComputer.this, taskListener);
K
Kohsuke Kawaguchi 已提交
243

244
                        launcher.launch(SlaveComputer.this, taskListener);
245
                    } catch (AbortException e) {
246
                        taskListener.error(e.getMessage());
247 248
                        throw e;
                    } catch (IOException e) {
249 250
                        Util.displayIOException(e,taskListener);
                        e.printStackTrace(taskListener.error(Messages.ComputerLauncher_unexpectedError()));
251 252
                        throw e;
                    } catch (InterruptedException e) {
253
                        e.printStackTrace(taskListener.error(Messages.ComputerLauncher_abortedLaunch()));
254
                        throw e;
255 256 257
                    } catch (Exception e) {
                        e.printStackTrace(taskListener.error(Messages.ComputerLauncher_unexpectedError()));
                        throw e;
258
                    }
259
                } finally {
260
                    if (channel==null) {
261
                        offlineCause = new OfflineCause.LaunchFailed();
262 263 264
                        for (ComputerListener cl : ComputerListener.all())
                            cl.onLaunchFailure(SlaveComputer.this, taskListener);
                    }
K
kohsuke 已提交
265
                }
266 267 268 269

                if (channel==null)
                    throw new IOException("Slave failed to connect, even though the launcher didn't report it. See the log output for details.");
                return null;
270 271 272 273 274 275 276 277 278 279 280 281 282
            }
        });
    }

    /**
     * {@inheritDoc}
     */
    @Override
    public void taskAccepted(Executor executor, Queue.Task task) {
        super.taskAccepted(executor, task);
        if (launcher instanceof ExecutorListener) {
            ((ExecutorListener)launcher).taskAccepted(executor, task);
        }
283

284 285 286 287
        //getNode() can return null at indeterminate times when nodes go offline
        Slave node = getNode();
        if (node != null && node.getRetentionStrategy() instanceof ExecutorListener) {
            ((ExecutorListener)node.getRetentionStrategy()).taskAccepted(executor, task);
288 289 290 291 292 293 294 295 296 297 298 299
        }
    }

    /**
     * {@inheritDoc}
     */
    @Override
    public void taskCompleted(Executor executor, Queue.Task task, long durationMS) {
        super.taskCompleted(executor, task, durationMS);
        if (launcher instanceof ExecutorListener) {
            ((ExecutorListener)launcher).taskCompleted(executor, task, durationMS);
        }
300
        RetentionStrategy r = getRetentionStrategy();
K
kohsuke 已提交
301 302
        if (r instanceof ExecutorListener) {
            ((ExecutorListener) r).taskCompleted(executor, task, durationMS);
303 304 305 306 307 308 309 310 311 312 313 314
        }
    }

    /**
     * {@inheritDoc}
     */
    @Override
    public void taskCompletedWithProblems(Executor executor, Queue.Task task, long durationMS, Throwable problems) {
        super.taskCompletedWithProblems(executor, task, durationMS, problems);
        if (launcher instanceof ExecutorListener) {
            ((ExecutorListener)launcher).taskCompletedWithProblems(executor, task, durationMS, problems);
        }
315 316 317
        RetentionStrategy r = getRetentionStrategy();
        if (r instanceof ExecutorListener) {
            ((ExecutorListener) r).taskCompletedWithProblems(executor, task, durationMS, problems);
318 319 320
        }
    }

K
kohsuke 已提交
321 322 323 324 325 326
    /**
     * Reports a connection attempt as in progress when the computer is offline
     * and the last connect activity has not finished yet.
     */
    @Override
    public boolean isConnecting() {
        final Future<?> pending = lastConnectActivity;
        if (!isOffline()) {
            return false;
        }
        return pending != null && !pending.isDone();
    }

327 328
    public OutputStream openLogFile() {
        try {
329 330 331
            log.rewind();
            return log;
        } catch (IOException e) {
332
            logger.log(Level.SEVERE, "Failed to create log file "+getLogFile(),e);
333
            return new NullStream();
334 335 336 337 338
        }
    }

    // Monitor held while setChannel() publishes a new channel and while closeChannel() clears it.
    private final Object channelLock = new Object();

K
kohsuke 已提交
339 340 341 342
    /**
     * Convenience overload that uses the logger of the given {@link TaskListener} as the launch log
     * and delegates to {@link #setChannel(InputStream, OutputStream, OutputStream, Channel.Listener)}.
     */
    public void setChannel(InputStream in, OutputStream out, TaskListener taskListener, Channel.Listener listener) throws IOException, InterruptedException {
        final OutputStream launchLog = taskListener.getLogger();
        setChannel(in, out, launchLog, listener);
    }

343 344
    /**
     * Creates a {@link Channel} from the given stream and sets that to this slave.
K
kohsuke 已提交
345 346 347 348 349 350 351 352 353 354 355 356 357
     *
     * @param in
     *      Stream connected to the remote "slave.jar". It's the caller's responsibility to do
     *      buffering on this stream, if that's necessary.
     * @param out
     *      Stream connected to the remote peer. It's the caller's responsibility to do
     *      buffering on this stream, if that's necessary.
     * @param launchLog
     *      If non-null, receive the portion of data in <tt>is</tt> before
     *      the data goes into the "binary mode". This is useful
     *      when the established communication channel might include some data that might
     *      be useful for debugging/trouble-shooting.
     * @param listener
358
     *      Gets a notification when the channel closes, to perform clean up. Can be null.
359 360
     *      By the time this method is called, the cause of the termination is reported to the user,
     *      so the implementation of the listener doesn't need to do that again.
361 362
     */
    public void setChannel(InputStream in, OutputStream out, OutputStream launchLog, Channel.Listener listener) throws IOException, InterruptedException {
K
Kohsuke Kawaguchi 已提交
363 364 365 366
        ChannelBuilder cb = new ChannelBuilder(nodeName,threadPoolForRemoting)
            .withMode(Channel.Mode.NEGOTIATE)
            .withHeaderStream(launchLog);

367 368
        for (ChannelConfigurator cc : ChannelConfigurator.all()) {
            cc.onChannelBuilding(cb,this);
K
Kohsuke Kawaguchi 已提交
369 370 371
        }

        Channel channel = cb.build(in,out);
372 373 374
        setChannel(channel,launchLog,listener);
    }

J
Jesse Glick 已提交
375 376 377 378 379 380 381 382
    /**
     * Shows {@link Channel#classLoadingCount}.
     *
     * @return the count reported by the slave, or -1 if there is currently no channel.
     * @since 1.495
     */
    public int getClassLoadingCount() throws IOException, InterruptedException {
        // snapshot the volatile field: closeChannel() may null it out concurrently
        final Channel ch = channel;
        if (ch == null) {
            return -1;
        }
        return ch.call(new LoadingCount(false));
    }

383 384 385
    /**
     * Shows {@link Channel#classLoadingPrefetchCacheCount}.
     *
     * @return -1 in case that capability is not supported, or if there is currently no channel
     * @since 1.519
     */
    public int getClassLoadingPrefetchCacheCount() throws IOException, InterruptedException {
        // snapshot the volatile field: closeChannel() may null it out concurrently
        final Channel ch = channel;
        if (ch == null || !ch.remoteCapability.supportsPrefetch()) {
            return -1;
        }
        return ch.call(new LoadingPrefetchCacheCount());
    }

J
Jesse Glick 已提交
395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418
    /**
     * Shows {@link Channel#resourceLoadingCount}.
     *
     * @return the count reported by the slave, or -1 if there is currently no channel.
     * @since 1.495
     */
    public int getResourceLoadingCount() throws IOException, InterruptedException {
        // snapshot the volatile field: closeChannel() may null it out concurrently
        final Channel ch = channel;
        if (ch == null) {
            return -1;
        }
        return ch.call(new LoadingCount(true));
    }

    /**
     * Shows {@link Channel#classLoadingTime}.
     *
     * @return the value reported by the slave, or -1 if there is currently no channel.
     * @since 1.495
     */
    public long getClassLoadingTime() throws IOException, InterruptedException {
        // snapshot the volatile field: closeChannel() may null it out concurrently
        final Channel ch = channel;
        if (ch == null) {
            return -1;
        }
        return ch.call(new LoadingTime(false));
    }

    /**
     * Shows {@link Channel#resourceLoadingTime}.
     *
     * @return the value reported by the slave, or -1 if there is currently no channel.
     * @since 1.495
     */
    public long getResourceLoadingTime() throws IOException, InterruptedException {
        // snapshot the volatile field: closeChannel() may null it out concurrently
        final Channel ch = channel;
        if (ch == null) {
            return -1;
        }
        return ch.call(new LoadingTime(true));
    }

419 420 421 422 423 424 425 426
    /**
     * Returns the remote FS root absolute path or {@code null} if the slave is off-line. The absolute path may change
     * between connections if the connection method does not provide a consistent working directory and the node's
     * remote FS is specified as a relative path.
     *
     * @return the remote FS root absolute path or {@code null} if the slave is off-line.
     * @since 1.FIXME
     */
427 428 429 430 431
    @CheckForNull
    public String getAbsoluteRemoteFs() {
        return channel == null ? null : absoluteRemoteFs;
    }

432
    static class LoadingCount extends MasterToSlaveCallable<Integer,RuntimeException> {
J
Jesse Glick 已提交
433 434 435 436 437 438 439 440 441 442
        private final boolean resource;
        LoadingCount(boolean resource) {
            this.resource = resource;
        }
        @Override public Integer call() {
            Channel c = Channel.current();
            return resource ? c.resourceLoadingCount.get() : c.classLoadingCount.get();
        }
    }

443
    static class LoadingPrefetchCacheCount extends MasterToSlaveCallable<Integer,RuntimeException> {
444 445 446 447 448
        @Override public Integer call() {
            return Channel.current().classLoadingPrefetchCacheCount.get();
        }
    }

449
    static class LoadingTime extends MasterToSlaveCallable<Long,RuntimeException> {
J
Jesse Glick 已提交
450 451 452 453 454 455 456 457 458 459
        private final boolean resource;
        LoadingTime(boolean resource) {
            this.resource = resource;
        }
        @Override public Long call() {
            Channel c = Channel.current();
            return resource ? c.resourceLoadingTime.get() : c.classLoadingTime.get();
        }
    }

460
    /**
461
     * Sets up the connection through an existing channel.
462 463 464 465
     *
     * @since 1.444
     */
    public void setChannel(Channel channel, OutputStream launchLog, Channel.Listener listener) throws IOException, InterruptedException {
466 467 468
        if(this.channel!=null)
            throw new IllegalStateException("Already connected");

469 470
        final TaskListener taskListener = new StreamTaskListener(launchLog);
        PrintStream log = taskListener.getLogger();
471

472 473
        channel.setProperty(SlaveComputer.class, this);

474
        channel.addListener(new Channel.Listener() {
475
            @Override
476 477
            public void onClosed(Channel c, IOException cause) {
                // Orderly shutdown will have null exception
478 479
                if (cause!=null) {
                    offlineCause = new ChannelTermination(cause);
480
                    cause.printStackTrace(taskListener.error("Connection terminated"));
481 482 483
                } else {
                    taskListener.getLogger().println("Connection terminated");
                }
484
                closeChannel();
485
                launcher.afterDisconnect(SlaveComputer.this, taskListener);
486 487
            }
        });
488 489
        if(listener!=null)
            channel.addListener(listener);
490

491 492 493
        String slaveVersion = channel.call(new SlaveVersion());
        log.println("Slave.jar version: " + slaveVersion);

494 495 496 497 498
        boolean _isUnix = channel.call(new DetectOS());
        log.println(_isUnix? hudson.model.Messages.Slave_UnixSlave():hudson.model.Messages.Slave_WindowsSlave());

        String defaultCharsetName = channel.call(new DetectDefaultCharset());

499 500 501 502
        Slave node = getNode();
        if (node == null) { // Node has been disabled/removed during the connection
            throw new IOException("Node "+nodeName+" has been deleted during the channel setup");
        }
503

504 505 506 507
        String remoteFS = node.getRemoteFS();
        if (Util.isRelativePath(remoteFS)) {
            remoteFS = channel.call(new AbsolutePath(remoteFS));
            log.println("NOTE: Relative remote path resolved to: "+remoteFS);
508
        }
509 510 511 512
        if(_isUnix && !remoteFS.contains("/") && remoteFS.contains("\\"))
            log.println("WARNING: "+remoteFS
                    +" looks suspiciously like Windows path. Maybe you meant "+remoteFS.replace('\\','/')+"?");
        FilePath root = new FilePath(channel,remoteFS);
513

K
Kohsuke Kawaguchi 已提交
514 515 516 517 518
        // reference counting problem is known to happen, such as JENKINS-9017, and so as a preventive measure
        // we pin the base classloader so that it'll never get GCed. When this classloader gets released,
        // it'll have a catastrophic impact on the communication.
        channel.pinClassLoader(getClass().getClassLoader());

519
        channel.call(new SlaveInitializer());
520 521 522 523 524 525 526 527
        SecurityContext old = ACL.impersonate(ACL.SYSTEM);
        try {
            for (ComputerListener cl : ComputerListener.all()) {
                cl.preOnline(this,channel,root,taskListener);
            }
        } finally {
            SecurityContextHolder.setContext(old);
        }
528

529 530
        offlineCause = null;

531 532 533 534 535 536 537 538 539 540 541 542 543 544 545
        // update the data structure atomically to prevent others from seeing a channel that's not properly initialized yet
        synchronized(channelLock) {
            if(this.channel!=null) {
                // check again. we used to have this entire method in a big sycnhronization block,
                // but Channel constructor blocks for an external process to do the connection
                // if CommandLauncher is used, and that cannot be interrupted because it blocks at InputStream.
                // so if the process hangs, it hangs the thread in a lock, and since Hudson will try to relaunch,
                // we'll end up queuing the lot of threads in a pseudo deadlock.
                // This implementation prevents that by avoiding a lock. HUDSON-1705 is likely a manifestation of this.
                channel.close();
                throw new IllegalStateException("Already connected");
            }
            isUnix = _isUnix;
            numRetryAttempt = 0;
            this.channel = channel;
546
            this.absoluteRemoteFs = remoteFS;
547
            defaultCharset = Charset.forName(defaultCharsetName);
548 549 550 551

            synchronized (statusChangeLock) {
                statusChangeLock.notifyAll();
            }
552
        }
553 554 555 556 557 558 559 560
        old = ACL.impersonate(ACL.SYSTEM);
        try {
            for (ComputerListener cl : ComputerListener.all()) {
                cl.onOnline(this,taskListener);
            }
        } finally {
            SecurityContextHolder.setContext(old);
        }
A
abayer 已提交
561
        log.println("Slave successfully connected and online");
562
        Jenkins.getInstance().getQueue().scheduleMaintenance();
563 564 565
    }

    @Override
566
    public Channel getChannel() {
567 568 569 570 571 572 573 574 575 576 577
        return channel;
    }

    /**
     * Returns the charset recorded when the channel was last set up.
     */
    public Charset getDefaultCharset() {
        final Charset recorded = defaultCharset;
        return recorded;
    }

    public List<LogRecord> getLogRecords() throws IOException, InterruptedException {
        if(channel==null)
            return Collections.emptyList();
        else
578
            return channel.call(new SlaveLogFetcher());
579 580
    }

581
    @RequirePOST
582 583 584
    public HttpResponse doDoDisconnect(@QueryParameter String offlineMessage) throws IOException, ServletException {
        if (channel!=null) {
            //does nothing in case computer is already disconnected
585
            checkPermission(DISCONNECT);
586
            offlineMessage = Util.fixEmptyAndTrim(offlineMessage);
587
            disconnect(new OfflineCause.UserCause(User.current(), offlineMessage));
588 589
        }
        return new HttpRedirect(".");
590 591 592
    }

    @Override
593 594
    public Future<?> disconnect(OfflineCause cause) {
        super.disconnect(cause);
K
kohsuke 已提交
595
        return Computer.threadPoolForRemoting.submit(new Runnable() {
596 597 598
            public void run() {
                // do this on another thread so that any lengthy disconnect operation
                // (which could be typical) won't block UI thread.
599 600 601
                launcher.beforeDisconnect(SlaveComputer.this, taskListener);
                closeChannel();
                launcher.afterDisconnect(SlaveComputer.this, taskListener);
602 603 604 605
            }
        });
    }

606
    @RequirePOST
607 608
    public void doLaunchSlaveAgent(StaplerRequest req, StaplerResponse rsp) throws IOException, ServletException {
        if(channel!=null) {
609
            req.getView(this,"already-launched.jelly").forward(req, rsp);
610 611 612
            return;
        }

K
kohsuke 已提交
613
        connect(true);
614 615 616 617 618 619 620 621 622 623 624

        // TODO: would be nice to redirect the user to "launching..." wait page,
        // then spend a few seconds there and poll for the completion periodically.
        rsp.sendRedirect("log");
    }

    public void tryReconnect() {
        numRetryAttempt++;
        if(numRetryAttempt<6 || (numRetryAttempt%12)==0) {
            // initially retry several times quickly, and after that, do it infrequently.
            logger.info("Attempting to reconnect "+nodeName);
K
kohsuke 已提交
625
            connect(true);
626 627 628 629 630 631
        }
    }

    /**
     * Serves jar files for JNLP slave agents.
     *
     * @param fileName
     *      name passed on to {@link Slave.JnlpJar}.
     * @deprecated since 2008-08-18.
     *      This URL binding is no longer used and moved up directly under to {@link jenkins.model.Jenkins},
     *      but it's left here for now just in case some old JNLP slave agents request it.
     */
    @Deprecated
    public Slave.JnlpJar getJnlpJars(String fileName) {
        return new Slave.JnlpJar(fileName);
    }

K
Kohsuke Kawaguchi 已提交
640
    @WebMethod(name="slave-agent.jnlp")
641 642
    public HttpResponse doSlaveAgentJnlp(StaplerRequest req, StaplerResponse res) throws IOException, ServletException {
        return new EncryptedSlaveAgentJnlpFile(this, "slave-agent.jnlp.jelly", getName(), CONNECT);
K
Kohsuke Kawaguchi 已提交
643 644
    }

645 646 647 648
    @Override
    protected void kill() {
        super.kill();
        closeChannel();
K
Kohsuke Kawaguchi 已提交
649
        IOUtils.closeQuietly(log);
650 651 652
    }

    public RetentionStrategy getRetentionStrategy() {
653
        Slave n = getNode();
654
        return n==null ? RetentionStrategy.INSTANCE : n.getRetentionStrategy();
655 656 657 658 659 660 661
    }

    /**
     * If still connected, disconnect.
     */
    private void closeChannel() {
        // TODO: race condition between this and the setChannel method.
662 663 664 665 666 667 668
        Channel c;
        synchronized (channelLock) {
            c = channel;
            channel = null;
            absoluteRemoteFs = null;
            isUnix = null;
        }
669 670 671 672 673 674
        if (c != null) {
            try {
                c.close();
            } catch (IOException e) {
                logger.log(Level.SEVERE, "Failed to terminate channel to " + getDisplayName(), e);
            }
675
            for (ComputerListener cl : ComputerListener.all())
676
                cl.onOffline(this, offlineCause);
677 678 679 680 681 682
        }
    }

    @Override
    protected void setNode(Node node) {
        super.setNode(node);
K
kohsuke 已提交
683
        launcher = grabLauncher(node);
684 685

        // maybe the configuration was changed to relaunch the slave, so try to re-launch now.
K
kohsuke 已提交
686 687
        // "constructed==null" test is an ugly hack to avoid launching before the object is fully
        // constructed.
688 689 690 691 692 693
        if(constructed!=null) {
            if (node instanceof Slave)
                ((Slave)node).getRetentionStrategy().check(this);
            else
                connect(false);
        }
K
kohsuke 已提交
694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709
    }

    /**
     * Grabs a {@link ComputerLauncher} out of {@link Node} to keep it in this {@link Computer}.
     * The returned launcher will be set to {@link #launcher} and used to carry out the actual launch operation.
     *
     * <p>
     * Subtypes that needs to decorate {@link ComputerLauncher} can do so by overriding this method.
     * This is useful for {@link SlaveComputer}s for clouds for example, where one normally needs
     * additional pre-launch step (such as waiting for the provisioned node to become available)
     * before the user specified launch step (like SSH connection) kicks in.
     *
     * @see ComputerLauncherFilter
     */
    protected ComputerLauncher grabLauncher(Node node) {
        return ((Slave)node).getLauncher();
710 711
    }

712 713 714 715 716 717 718 719 720 721 722 723 724 725
    /**
     * Asks the slave, through the current channel, for its version.
     */
    public String getSlaveVersion() throws IOException, InterruptedException {
        final String version = channel.call(new SlaveVersion());
        return version;
    }

    /**
     * Describes the slave's OS family as either "Unix" or "Windows",
     * based on what {@link DetectOS} reports over the current channel.
     */
    public String getOSDescription() throws IOException, InterruptedException {
        final boolean unix = channel.call(new DetectOS());
        if (unix) {
            return "Unix";
        }
        return "Windows";
    }

726 727
    // Logger named after this class.
    private static final Logger logger = Logger.getLogger(SlaveComputer.class.getName());

728
    private static final class SlaveVersion extends MasterToSlaveCallable<String,IOException> {
729 730 731 732 733
        public String call() throws IOException {
            try { return Launcher.VERSION; }
            catch (Throwable ex) { return "< 1.335"; } // Older slave.jar won't have VERSION
        }
    }
734
    private static final class DetectOS extends MasterToSlaveCallable<Boolean,IOException> {
735 736 737 738 739
        public Boolean call() throws IOException {
            return File.pathSeparatorChar==':';
        }
    }

740
    private static final class AbsolutePath extends MasterToSlaveCallable<String,IOException> {
741 742 743

        private static final long serialVersionUID = 1L;

744 745 746 747 748 749 750 751 752 753 754
        private final String relativePath;

        private AbsolutePath(String relativePath) {
            this.relativePath = relativePath;
        }

        public String call() throws IOException {
            return new File(relativePath).getAbsolutePath();
        }
    }

755
    private static final class DetectDefaultCharset extends MasterToSlaveCallable<String,IOException> {
756 757 758 759 760 761
        public String call() throws IOException {
            return Charset.defaultCharset().name();
        }
    }

    /**
762 763
     * Puts the {@link #SLAVE_LOG_HANDLER} into a separate class so that loading this class
     * in JVM doesn't end up loading tons of additional classes.
764
     */
765 766 767 768 769 770
    static final class LogHolder {
        /**
         * This field is used on each slave node to record log records on the slave.
         */
        static final RingBufferLogHandler SLAVE_LOG_HANDLER = new RingBufferLogHandler();
    }
771

772
    private static class SlaveInitializer extends MasterToSlaveCallable<Void,RuntimeException> {
773
        public Void call() {
774 775 776
            // avoid double installation of the handler. JNLP slaves can reconnect to the master multiple times
            // and each connection gets a different RemoteClassLoader, so we need to evict them by class name,
            // not by their identity.
K
Kohsuke Kawaguchi 已提交
777
            for (Handler h : LOGGER.getHandlers()) {
778
                if (h.getClass().getName().equals(SLAVE_LOG_HANDLER.getClass().getName()))
K
Kohsuke Kawaguchi 已提交
779
                    LOGGER.removeHandler(h);
780
            }
K
Kohsuke Kawaguchi 已提交
781
            LOGGER.addHandler(SLAVE_LOG_HANDLER);
782

K
Kohsuke Kawaguchi 已提交
783
            // remove Sun PKCS11 provider if present. See http://wiki.jenkins-ci.org/display/JENKINS/Solaris+Issue+6276483
784 785 786 787 788 789
            try {
                Security.removeProvider("SunPKCS11-Solaris");
            } catch (SecurityException e) {
                // ignore this error.
            }

790
            Channel.current().setProperty("slave",Boolean.TRUE); // indicate that this side of the channel is the slave side.
791

792 793 794
            return null;
        }
        private static final long serialVersionUID = 1L;
795
        private static final Logger LOGGER = Logger.getLogger("");
796
    }
797 798 799 800 801 802 803 804 805 806 807

    /**
     * Obtains a {@link VirtualChannel} that allows some computation to be performed on the master.
     * This method can be called from any thread on the master, or from slave (more precisely,
     * it only works from the remoting request-handling thread in slaves, which means if you've started
     * separate thread on slaves, that'll fail.)
     *
     * @return null if the calling thread doesn't have any trace of where its master is.
     * @since 1.362
     */
    public static VirtualChannel getChannelToMaster() {
808
        if (Jenkins.getInstance()!=null)
K
Kohsuke Kawaguchi 已提交
809
            return FilePath.localChannel;
810 811 812

        // if this method is called from within the slave computation thread, this should work
        Channel c = Channel.current();
813
        if (c!=null && Boolean.TRUE.equals(c.getProperty("slave")))
814 815 816 817
            return c;

        return null;
    }
818

819 820 821 822 823 824 825
    /**
     * Helper for Jelly views: exposes everything returned by {@link SlaveSystemInfo#all()}.
     */
    public static List<SlaveSystemInfo> getSystemInfoExtensions() {
        final List<SlaveSystemInfo> extensions = SlaveSystemInfo.all();
        return extensions;
    }

826
    private static class SlaveLogFetcher extends MasterToSlaveCallable<List<LogRecord>,RuntimeException> {
827 828 829 830
        public List<LogRecord> call() {
            return new ArrayList<LogRecord>(SLAVE_LOG_HANDLER.getView());
        }
    }
831
}