blob: 9140f9eb08458fd7163dfa724e5452f800c7dc6f [file] [log] [blame]
// Copyright 2023 The Dawn & Tint Authors
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
//
// 1. Redistributions of source code must retain the above copyright notice, this
// list of conditions and the following disclaimer.
//
// 2. Redistributions in binary form must reproduce the above copyright notice,
// this list of conditions and the following disclaimer in the documentation
// and/or other materials provided with the distribution.
//
// 3. Neither the name of the copyright holder nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
// FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
// DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
// SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
// CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
// OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
#ifndef SRC_DAWN_NATIVE_EXECUTIONQUEUE_H_
#define SRC_DAWN_NATIVE_EXECUTIONQUEUE_H_
#include <atomic>
#include <condition_variable>
#include <functional>
#include <mutex>
#include <vector>
#include "dawn/common/MutexProtected.h"
#include "dawn/common/RefCounted.h"
#include "dawn/common/SerialMap.h"
#include "dawn/common/Time.h"
#include "dawn/common/ityp_array.h"
#include "dawn/native/Error.h"
#include "dawn/native/IntegerTypes.h"
#include "dawn/native/ObjectBase.h"
#include "partition_alloc/pointers/raw_ptr.h"
namespace dawn::native {
// Queue task priority can be specified such that when user facing code is called, i.e. |WaitAny|,
// we can do the minimum amount of work to remain responsive. For other classes of priority, we may
// defer and execute them either on another thread if full spontaneous is enabled, or when
// |Tick| is called in the meantime. Higher numeric values correspond to higher priority. Note that
// this is loosely based off of TaskPriority in Chromium:
// https://source.chromium.org/chromium/chromium/src/+/main:base/task/task_traits.h
// Note that when the queue is asked to process tasks of a given priorty, it will process any tasks
// of that priority or higher.
enum class QueuePriority : size_t {
// This will always be the lowest priority available. We use 1 instead of 0 because we implement
// a decrement operator to iterate through the priorities and by reserving 0, we can assert that
// we don't underflow.
Lowest = 1,
BestEffort = Lowest,
UserVisible,
Highest = UserVisible,
};
// Represents an engine which processes a stream of GPU work. It handles the tracking and
// update of the various ExecutionSerials related to that work.
// TODO(dawn:831, dawn:1413): Make usage of the ExecutionQueue thread-safe. Right now it is
// only partially safe - where observation of the last-submitted and pending serials is atomic.
class ExecutionQueueBase : public ApiObjectBase {
public:
using Task = std::function<void()>;
// Implementations of this class are registered to the queue such that when the serial tracked
// by the queue increases, the processor is notified and updated as well. Prefer registering a
// SerialProcessor over tracking a SerialTask when the task would need to keep track of extended
// state, happen frequently, or acquire the same lock multiple times if split into separate
// tasks. Implementations must also be thread-safe.
class SerialProcessor : public RefCounted {
public:
// This is the entry point that's fired whenever the queue's internal completed serial is
// updated.
virtual void UpdateCompletedSerialTo(ExecutionSerial completedSerial) = 0;
// Implementations need to implement this shut down function to set some internal state such
// that any further tracking on the processor is processed immediately since the
// |UpdateCompletedSerialTo| entry point will no longer be called after this point.
virtual void AssumeCommandsComplete() = 0;
};
// The latest serial known to have completed execution on the queue.
ExecutionSerial GetCompletedCommandSerial() const;
// The serial of the latest batch of work sent for execution.
ExecutionSerial GetLastSubmittedCommandSerial() const;
// The serial of the batch that is currently pending submission.
ExecutionSerial GetPendingCommandSerial() const;
// The serial by which time all currently submitted or pending operations will be completed.
ExecutionSerial GetScheduledWorkDoneSerial() const;
// Whether the execution queue has scheduled commands to be submitted or executing.
bool HasScheduledCommands() const;
// Check for passed fences and set the new completed serial. Note that the two functions below
// effectively do the same thing initially, however, |UpdateCompletedSerials| may additionally
// trigger user callbacks. Note that for the purpose of going forwards, |CheckPassedSerials|
// should not be used anymore.
// TODO(crbug.com/42240396): Remove |CheckPassedSerials| in favor of |UpdateCompletedSerial|.
MaybeError CheckPassedSerials();
MaybeError UpdateCompletedSerial(QueuePriority priority);
// For the commands being internally recorded in backend, that were not urgent to submit, this
// method makes them to be submitted as soon as possible in next ticks.
virtual void ForceEventualFlushOfCommands() = 0;
// Ensures that all commands which were recorded are flushed upto the given serial.
MaybeError EnsureCommandsFlushed(ExecutionSerial serial);
// Submit any pending commands that are enqueued.
MaybeError SubmitPendingCommands();
// During shut down of device, some operations might have been started since the last submit
// and waiting on a serial that doesn't have a corresponding fence enqueued. Fake serials to
// make all commands look completed.
void AssumeCommandsComplete();
// Increment mLastSubmittedSerial when we submit the next serial
void IncrementLastSubmittedCommandSerial();
// Waits for GPU to finish, checks errors and gets ready for destruction. This is only used when
// properly destructing the device. For a real device loss, this function doesn't need to be
// called since the driver already closed all resources.
MaybeError WaitForIdleForDestruction();
// Wait at most `timeout` synchronously for the ExecutionSerial to pass.
MaybeError WaitForQueueSerial(ExecutionSerial serial, Nanoseconds timeout);
// Registers a SerialProcessor that will be notified of serial updates. Note that serial
// processors are always notified before handling serial tasks.
void RegisterSerialProcessor(QueuePriority priority, Ref<SerialProcessor>&& serialProcessor);
// Tracks new tasks to complete when |serial| is reached.
void TrackSerialTask(QueuePriority priority, ExecutionSerial serial, Task&& task);
// In the 'Normal' mode, currently recorded commands in the backend submitted in the next Tick.
// However in the 'Passive' mode, the submission will be postponed as late as possible, for
// example, until the client has explictly issued a submission.
enum class SubmitMode { Normal, Passive };
protected:
using ApiObjectBase::ApiObjectBase;
~ExecutionQueueBase() override;
static constexpr ExecutionSerial kWaitSerialTimeout = kBeginningOfGPUTime;
// Currently, the queue has two paths for serial updating, one is via DeviceBase::Tick which
// calls into the backend specific polling mechanisms implemented in
// CheckAndUpdateCompletedSerials. Alternatively, the backend can actively call
// UpdateCompletedSerialTo when a new serial is complete to make forward progress proactively.
void UpdateCompletedSerialTo(QueuePriority priority, ExecutionSerial completedSerial);
private:
// Each backend should implement to check their passed fences if there are any and return a
// completed serial. Return 0 should indicate no fences to check.
virtual ResultOrError<ExecutionSerial> CheckAndUpdateCompletedSerials() = 0;
// Backend specific wait function, returns kWaitSerialTimeout if we did not successfully wait
// for |waitSerial|. The default implementations just waits on the internal condition variable
// protected |mCompletedSerial|.
virtual ResultOrError<ExecutionSerial> WaitForQueueSerialImpl(ExecutionSerial waitSerial,
Nanoseconds timeout);
// Backend specific wait for idle function.
virtual MaybeError WaitForIdleForDestructionImpl() = 0;
// Indicates whether the backend has pending commands to be submitted as soon as possible.
virtual bool HasPendingCommands() const = 0;
// Submit any pending commands that are enqueued.
virtual MaybeError SubmitPendingCommandsImpl() = 0;
void UpdateCompletedSerialToInternal(QueuePriority priority,
ExecutionSerial completedSerial,
bool forceTasks = false);
// |mCompletedSerial| tracks the last completed command serial that the fence has returned.
// |mLastSubmittedSerial| tracks the last submitted command serial.
// During device removal, the serials could be artificially incremented to make it appear as if
// commands have been completed.
MutexCondVarProtected<uint64_t> mCompletedSerial = static_cast<uint64_t>(kBeginningOfGPUTime);
std::atomic<uint64_t> mLastSubmittedSerial = static_cast<uint64_t>(kBeginningOfGPUTime);
// Mutex, condition variable, and boolean statuses are used by the class to synchronize task
// completion to ensure that:
// 1) Callback ordering is guaranteed.
// 2) Re-entrant callbacks do not cause lock-inversion issues w.r.t this lock and the
// device lock.
template <typename T>
using QueuePriorityArray =
ityp::array<QueuePriority, T, static_cast<size_t>(QueuePriority::Highest) + 1>;
struct State {
bool mCallingCallbacks = false;
bool mWaitingForIdle = false;
bool mAssumeCompleted = false;
QueuePriorityArray<std::vector<Ref<SerialProcessor>>> mWaitingProcessors;
QueuePriorityArray<SerialMap<ExecutionSerial, Task>> mWaitingTasks;
};
MutexCondVarProtected<State> mState;
};
} // namespace dawn::native
#endif // SRC_DAWN_NATIVE_EXECUTIONQUEUE_H_