src/hotspot/share/gc/shared/partialArrayTaskStepper.inline.hpp - toolchain/jdk/jdk21 - Git at Google

 /*
  * Copyright (c) 2020, 2023, Oracle and/or its affiliates. All rights reserved.
  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
  *
  * This code is free software; you can redistribute it and/or modify it
  * under the terms of the GNU General Public License version 2 only, as
  * published by the Free Software Foundation.
  *
  * This code is distributed in the hope that it will be useful, but WITHOUT
  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  * version 2 for more details (a copy is included in the LICENSE file that
  * accompanied this code).
  *
  * You should have received a copy of the GNU General Public License version
  * 2 along with this work; if not, write to the Free Software Foundation,
  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
  *
  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
  * or visit www.oracle.com if you need additional information or have any
  * questions.
  *
  */

 #ifndef SHARE_GC_SHARED_PARTIALARRAYTASKSTEPPER_INLINE_HPP
 #define SHARE_GC_SHARED_PARTIALARRAYTASKSTEPPER_INLINE_HPP

 #include "gc/shared/partialArrayTaskStepper.hpp"

 #include "oops/arrayOop.hpp"
 #include "runtime/atomic.hpp"

 PartialArrayTaskStepper::Step
 PartialArrayTaskStepper::start_impl(int length,
                                     int* to_length_addr,
                                     int chunk_size) const {
   assert(chunk_size > 0, "precondition");

   int end = length % chunk_size; // End of initial chunk.
   // Set to's length to end of initial chunk.  Partial tasks use that length
   // field as the start of the next chunk to process.  Must be done before
   // enqueuing partial scan tasks, in case other threads steal any of those
   // tasks.
   //
   // The value of end can be 0, either because of a 0-length array or
   // because length is a multiple of the chunk size.  Both of those are
   // relatively rare and handled in the normal course of the iteration, so
   // not worth doing anything special about here.
   *to_length_addr = end;

   // If the initial chunk is the complete array, then don't need any partial
   // tasks.  Otherwise, start with just one partial task; see new task
   // calculation in next().
   Step result = { end, (length > end) ? 1u : 0u };
   return result;
 }

 PartialArrayTaskStepper::Step
 PartialArrayTaskStepper::start(arrayOop from, arrayOop to, int chunk_size) const {
   return start_impl(from->length(), to->length_addr(), chunk_size);
 }

 PartialArrayTaskStepper::Step
 PartialArrayTaskStepper::next_impl(int length,
                                    int* to_length_addr,
                                    int chunk_size) const {
   assert(chunk_size > 0, "precondition");

   // The start of the next task is in the length field of the to-space object.
   // Atomically increment by the chunk size to claim the associated chunk.
   // Because we limit the number of enqueued tasks to being no more than the
   // number of remaining chunks to process, we can use an atomic add for the
   // claim, rather than a CAS loop.
   int start = Atomic::fetch_then_add(to_length_addr,
                                      chunk_size,
                                      memory_order_relaxed);

   assert(start < length, "invariant: start %d, length %d", start, length);
   assert(((length - start) % chunk_size) == 0,
          "invariant: start %d, length %d, chunk size %d",
          start, length, chunk_size);

   // Determine the number of new tasks to create.
   // Zero-based index for this partial task.  The initial task isn't counted.
   uint task_num = (start / chunk_size);
   // Number of tasks left to process, including this one.
   uint remaining_tasks = (length - start) / chunk_size;
   assert(remaining_tasks > 0, "invariant");
   // Compute number of pending tasks, including this one.  The maximum number
   // of tasks is a function of task_num (N) and _task_fanout (F).
   //   1    : current task
   //   N    : number of preceding tasks
   //   F*N  : maximum created for preceding tasks
   // => F*N - N + 1 : maximum number of tasks
   // => (F-1)*N + 1
   assert(_task_limit > 0, "precondition");
   assert(_task_fanout > 0, "precondition");
   uint max_pending = (_task_fanout - 1) * task_num + 1;

   // The actual pending may be less than that.  Bound by remaining_tasks to
   // not overrun.  Also bound by _task_limit to avoid spawning an excessive
   // number of tasks for a large array.  The +1 is to replace the current
   // task with a new task when _task_limit limited.  The pending value may
   // not be what's actually in the queues, because of concurrent task
   // processing.  That's okay; we just need to determine the correct number
   // of tasks to add for this task.
   uint pending = MIN3(max_pending, remaining_tasks, _task_limit);
   uint ncreate = MIN2(_task_fanout, MIN2(remaining_tasks, _task_limit + 1) - pending);
   Step result = { start, ncreate };
   return result;
 }

 PartialArrayTaskStepper::Step
 PartialArrayTaskStepper::next(arrayOop from, arrayOop to, int chunk_size) const {
   return next_impl(from->length(), to->length_addr(), chunk_size);
 }

 #endif // SHARE_GC_SHARED_PARTIALARRAYTASKSTEPPER_INLINE_HPP
	/*
	* Copyright (c) 2020, 2023, Oracle and/or its affiliates. All rights reserved.
	* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
	*
	* This code is free software; you can redistribute it and/or modify it
	* under the terms of the GNU General Public License version 2 only, as
	* published by the Free Software Foundation.
	*
	* This code is distributed in the hope that it will be useful, but WITHOUT
	* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
	* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
	* version 2 for more details (a copy is included in the LICENSE file that
	* accompanied this code).
	*
	* You should have received a copy of the GNU General Public License version
	* 2 along with this work; if not, write to the Free Software Foundation,
	* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
	*
	* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
	* or visit www.oracle.com if you need additional information or have any
	* questions.
	*
	*/

	#ifndef SHARE_GC_SHARED_PARTIALARRAYTASKSTEPPER_INLINE_HPP
	#define SHARE_GC_SHARED_PARTIALARRAYTASKSTEPPER_INLINE_HPP

	#include "gc/shared/partialArrayTaskStepper.hpp"

	#include "oops/arrayOop.hpp"
	#include "runtime/atomic.hpp"

	PartialArrayTaskStepper::Step
	PartialArrayTaskStepper::start_impl(int length,
	int* to_length_addr,
	int chunk_size) const {
	assert(chunk_size > 0, "precondition");

	int end = length % chunk_size; // End of initial chunk.
	// Set to's length to end of initial chunk. Partial tasks use that length
	// field as the start of the next chunk to process. Must be done before
	// enqueuing partial scan tasks, in case other threads steal any of those
	// tasks.
	//
	// The value of end can be 0, either because of a 0-length array or
	// because length is a multiple of the chunk size. Both of those are
	// relatively rare and handled in the normal course of the iteration, so
	// not worth doing anything special about here.
	*to_length_addr = end;

	// If the initial chunk is the complete array, then don't need any partial
	// tasks. Otherwise, start with just one partial task; see new task
	// calculation in next().
	Step result = { end, (length > end) ? 1u : 0u };
	return result;
	}

	PartialArrayTaskStepper::Step
	PartialArrayTaskStepper::start(arrayOop from, arrayOop to, int chunk_size) const {
	return start_impl(from->length(), to->length_addr(), chunk_size);
	}

	PartialArrayTaskStepper::Step
	PartialArrayTaskStepper::next_impl(int length,
	int* to_length_addr,
	int chunk_size) const {
	assert(chunk_size > 0, "precondition");

	// The start of the next task is in the length field of the to-space object.
	// Atomically increment by the chunk size to claim the associated chunk.
	// Because we limit the number of enqueued tasks to being no more than the
	// number of remaining chunks to process, we can use an atomic add for the
	// claim, rather than a CAS loop.
	int start = Atomic::fetch_then_add(to_length_addr,
	chunk_size,
	memory_order_relaxed);

	assert(start < length, "invariant: start %d, length %d", start, length);
	assert(((length - start) % chunk_size) == 0,
	"invariant: start %d, length %d, chunk size %d",
	start, length, chunk_size);

	// Determine the number of new tasks to create.
	// Zero-based index for this partial task. The initial task isn't counted.
	uint task_num = (start / chunk_size);
	// Number of tasks left to process, including this one.
	uint remaining_tasks = (length - start) / chunk_size;
	assert(remaining_tasks > 0, "invariant");
	// Compute number of pending tasks, including this one. The maximum number
	// of tasks is a function of task_num (N) and _task_fanout (F).
	// 1 : current task
	// N : number of preceding tasks
	// F*N : maximum created for preceding tasks
	// => F*N - N + 1 : maximum number of tasks
	// => (F-1)*N + 1
	assert(_task_limit > 0, "precondition");
	assert(_task_fanout > 0, "precondition");
	uint max_pending = (_task_fanout - 1) * task_num + 1;

	// The actual pending may be less than that. Bound by remaining_tasks to
	// not overrun. Also bound by _task_limit to avoid spawning an excessive
	// number of tasks for a large array. The +1 is to replace the current
	// task with a new task when _task_limit limited. The pending value may
	// not be what's actually in the queues, because of concurrent task
	// processing. That's okay; we just need to determine the correct number
	// of tasks to add for this task.
	uint pending = MIN3(max_pending, remaining_tasks, _task_limit);
	uint ncreate = MIN2(_task_fanout, MIN2(remaining_tasks, _task_limit + 1) - pending);
	Step result = { start, ncreate };
	return result;
	}

	PartialArrayTaskStepper::Step
	PartialArrayTaskStepper::next(arrayOop from, arrayOop to, int chunk_size) const {
	return next_impl(from->length(), to->length_addr(), chunk_size);
	}

	#endif // SHARE_GC_SHARED_PARTIALARRAYTASKSTEPPER_INLINE_HPP