taskqueue.cpp 8.0 KB
Newer Older
D
duke 已提交
1
/*
X
xdono 已提交
2
 * Copyright 2001-2009 Sun Microsystems, Inc.  All Rights Reserved.
D
duke 已提交
3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
 * CA 95054 USA or visit www.sun.com if you need additional information or
 * have any questions.
 *
 */

# include "incls/_precompiled.incl"
# include "incls/_taskqueue.cpp.incl"

28 29 30 31 32 33
#ifdef TRACESPINNING
uint ParallelTaskTerminator::_total_yields = 0;
uint ParallelTaskTerminator::_total_spins = 0;
uint ParallelTaskTerminator::_total_peeks = 0;
#endif

D
duke 已提交
34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66
bool TaskQueueSuper::peek() {
  return _bottom != _age.top();
}

int TaskQueueSetSuper::randomParkAndMiller(int *seed0) {
  const int a =      16807;
  const int m = 2147483647;
  const int q =     127773;  /* m div a */
  const int r =       2836;  /* m mod a */
  assert(sizeof(int) == 4, "I think this relies on that");
  int seed = *seed0;
  int hi   = seed / q;
  int lo   = seed % q;
  int test = a * lo - r * hi;
  if (test > 0)
    seed = test;
  else
    seed = test + m;
  *seed0 = seed;
  return seed;
}

ParallelTaskTerminator::
ParallelTaskTerminator(int n_threads, TaskQueueSetSuper* queue_set) :
  _n_threads(n_threads),
  _queue_set(queue_set),
  _offered_termination(0) {}

bool ParallelTaskTerminator::peek_in_queue_set() {
  return _queue_set->peek();
}

void ParallelTaskTerminator::yield() {
67
  assert(_offered_termination <= _n_threads, "Invariant");
D
duke 已提交
68 69 70 71
  os::yield();
}

void ParallelTaskTerminator::sleep(uint millis) {
72
  assert(_offered_termination <= _n_threads, "Invariant");
D
duke 已提交
73 74 75
  os::sleep(Thread::current(), millis, false);
}

76 77
bool
ParallelTaskTerminator::offer_termination(TerminatorTerminator* terminator) {
78
  assert(_offered_termination < _n_threads, "Invariant");
D
duke 已提交
79 80
  Atomic::inc(&_offered_termination);

81
  uint yield_count = 0;
82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100
  // Number of hard spin loops done since last yield
  uint hard_spin_count = 0;
  // Number of iterations in the hard spin loop.
  uint hard_spin_limit = WorkStealingHardSpins;

  // If WorkStealingSpinToYieldRatio is 0, no hard spinning is done.
  // If it is greater than 0, then start with a small number
  // of spins and increase number with each turn at spinning until
  // the count of hard spins exceeds WorkStealingSpinToYieldRatio.
  // Then do a yield() call and start spinning afresh.
  if (WorkStealingSpinToYieldRatio > 0) {
    hard_spin_limit = WorkStealingHardSpins >> WorkStealingSpinToYieldRatio;
    hard_spin_limit = MAX2(hard_spin_limit, 1U);
  }
  // Remember the initial spin limit.
  uint hard_spin_start = hard_spin_limit;

  // Loop waiting for all threads to offer termination or
  // more work.
D
duke 已提交
101
  while (true) {
102
    assert(_offered_termination <= _n_threads, "Invariant");
103
    // Are all threads offering termination?
D
duke 已提交
104 105 106
    if (_offered_termination == _n_threads) {
      return true;
    } else {
107 108 109
      // Look for more work.
      // Periodically sleep() instead of yield() to give threads
      // waiting on the cores the chance to grab this code
D
duke 已提交
110
      if (yield_count <= WorkStealingYieldsBeforeSleep) {
111 112
        // Do a yield or hardspin.  For purposes of deciding whether
        // to sleep, count this as a yield.
D
duke 已提交
113
        yield_count++;
114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137

        // Periodically call yield() instead spinning
        // After WorkStealingSpinToYieldRatio spins, do a yield() call
        // and reset the counts and starting limit.
        if (hard_spin_count > WorkStealingSpinToYieldRatio) {
          yield();
          hard_spin_count = 0;
          hard_spin_limit = hard_spin_start;
#ifdef TRACESPINNING
          _total_yields++;
#endif
        } else {
          // Hard spin this time
          // Increase the hard spinning period but only up to a limit.
          hard_spin_limit = MIN2(2*hard_spin_limit,
                                 (uint) WorkStealingHardSpins);
          for (uint j = 0; j < hard_spin_limit; j++) {
            SpinPause();
          }
          hard_spin_count++;
#ifdef TRACESPINNING
          _total_spins++;
#endif
        }
D
duke 已提交
138 139 140 141 142 143 144 145 146 147 148 149 150 151
      } else {
        if (PrintGCDetails && Verbose) {
         gclog_or_tty->print_cr("ParallelTaskTerminator::offer_termination() "
           "thread %d sleeps after %d yields",
           Thread::current(), yield_count);
        }
        yield_count = 0;
        // A sleep will cause this processor to seek work on another processor's
        // runqueue, if it has nothing else to run (as opposed to the yield
        // which may only move the thread to the end of the this processor's
        // runqueue).
        sleep(WorkStealingSleepMillis);
      }

152 153 154
#ifdef TRACESPINNING
      _total_peeks++;
#endif
155 156
      if (peek_in_queue_set() ||
          (terminator != NULL && terminator->should_exit_termination())) {
D
duke 已提交
157
        Atomic::dec(&_offered_termination);
158
        assert(_offered_termination < _n_threads, "Invariant");
D
duke 已提交
159 160 161 162 163 164
        return false;
      }
    }
  }
}

165 166 167 168 169 170 171 172 173 174
#ifdef TRACESPINNING
void ParallelTaskTerminator::print_termination_counts() {
  gclog_or_tty->print_cr("ParallelTaskTerminator Total yields: %lld  "
    "Total spins: %lld  Total peeks: %lld",
    total_yields(),
    total_spins(),
    total_peeks());
}
#endif

D
duke 已提交
175 176 177 178 179 180 181 182
void ParallelTaskTerminator::reset_for_reuse() {
  if (_offered_termination != 0) {
    assert(_offered_termination == _n_threads,
           "Terminator may still be in use");
    _offered_termination = 0;
  }
}

183 184
bool RegionTaskQueueWithOverflow::is_empty() {
  return (_region_queue.size() == 0) &&
D
duke 已提交
185 186 187
         (_overflow_stack->length() == 0);
}

188 189
bool RegionTaskQueueWithOverflow::stealable_is_empty() {
  return _region_queue.size() == 0;
D
duke 已提交
190 191
}

192
bool RegionTaskQueueWithOverflow::overflow_is_empty() {
D
duke 已提交
193 194 195
  return _overflow_stack->length() == 0;
}

196 197
void RegionTaskQueueWithOverflow::initialize() {
  _region_queue.initialize();
D
duke 已提交
198 199
  assert(_overflow_stack == 0, "Creating memory leak");
  _overflow_stack =
200
    new (ResourceObj::C_HEAP) GrowableArray<RegionTask>(10, true);
D
duke 已提交
201 202
}

203 204
void RegionTaskQueueWithOverflow::save(RegionTask t) {
  if (TraceRegionTasksQueuing && Verbose) {
D
duke 已提交
205 206
    gclog_or_tty->print_cr("CTQ: save " PTR_FORMAT, t);
  }
207
  if(!_region_queue.push(t)) {
D
duke 已提交
208 209 210 211
    _overflow_stack->push(t);
  }
}

212
// Note that using this method will retrieve all regions
D
duke 已提交
213 214 215 216
// that have been saved but that it will always check
// the overflow stack.  It may be more efficient to
// check the stealable queue and the overflow stack
// separately.
217 218
bool RegionTaskQueueWithOverflow::retrieve(RegionTask& region_task) {
  bool result = retrieve_from_overflow(region_task);
D
duke 已提交
219
  if (!result) {
220
    result = retrieve_from_stealable_queue(region_task);
D
duke 已提交
221
  }
222
  if (TraceRegionTasksQueuing && Verbose && result) {
D
duke 已提交
223 224 225 226 227
    gclog_or_tty->print_cr("  CTQ: retrieve " PTR_FORMAT, result);
  }
  return result;
}

228 229 230 231 232
bool RegionTaskQueueWithOverflow::retrieve_from_stealable_queue(
                                   RegionTask& region_task) {
  bool result = _region_queue.pop_local(region_task);
  if (TraceRegionTasksQueuing && Verbose) {
    gclog_or_tty->print_cr("CTQ: retrieve_stealable " PTR_FORMAT, region_task);
D
duke 已提交
233 234 235 236
  }
  return result;
}

237 238
bool
RegionTaskQueueWithOverflow::retrieve_from_overflow(RegionTask& region_task) {
D
duke 已提交
239 240
  bool result;
  if (!_overflow_stack->is_empty()) {
241
    region_task = _overflow_stack->pop();
D
duke 已提交
242 243
    result = true;
  } else {
244
    region_task = (RegionTask) NULL;
D
duke 已提交
245 246
    result = false;
  }
247 248
  if (TraceRegionTasksQueuing && Verbose) {
    gclog_or_tty->print_cr("CTQ: retrieve_stealable " PTR_FORMAT, region_task);
D
duke 已提交
249 250 251
  }
  return result;
}