/*
* MVKSync.mm
*
* Copyright (c) 2014-2019 The Brenwill Workshop Ltd. (http://www.brenwill.com)
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "MVKSync.h"
#include "MVKFoundation.h"
#include "MVKLogging.h"
using namespace std;

#pragma mark -
#pragma mark MVKSemaphoreImpl

bool MVKSemaphoreImpl::release() {
lock_guard<mutex> lock(_lock);
if (isClear()) { return true; }
// Either decrement the reservation counter, or clear it altogether
if (_shouldWaitAll) {
if (_reservationCount > 0) { _reservationCount--; }
} else {
_reservationCount = 0;
}
// If all reservations have been released, unblock all waiting threads
if ( isClear() ) { _blocker.notify_all(); }
return isClear();
}
void MVKSemaphoreImpl::reserve() {
lock_guard<mutex> lock(_lock);
_reservationCount++;
}
bool MVKSemaphoreImpl::wait(uint64_t timeout, bool reserveAgain) {
unique_lock<mutex> lock(_lock);
bool isDone;
if (timeout == 0) {
isDone = isClear();
} else if (timeout == UINT64_MAX) {
_blocker.wait(lock, [this]{ return isClear(); });
isDone = true;
} else {
// Limit timeout to avoid overflow since wait_for() uses wait_until()
uint64_t nanoTimeout = min(timeout, kMVKUndefinedLargeUInt64);
chrono::nanoseconds nanos(nanoTimeout);
isDone = _blocker.wait_for(lock, nanos, [this]{ return isClear(); });
}
if (reserveAgain) { _reservationCount++; }
return isDone;
}
MVKSemaphoreImpl::~MVKSemaphoreImpl() {
// Acquire the lock to ensure that any thread currently holding it (e.g. one clearing the final reservation in release()) finishes before this instance is destroyed.
lock_guard<mutex> lock(_lock);
}
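// Illustrative sketch (not part of MoltenVK): how the reservation counting above is typically
// exercised. With wait-all semantics every reserve() must be matched by a release() before
// waiters unblock; with wait-any semantics a single release() clears all reservations at once.
// The constructor arguments are inferred from the MVKSemaphore constructor below, and the
// function and variable names here are hypothetical.
static inline void exampleSemaphoreImplUsage() {
	MVKSemaphoreImpl waitAllSem(true, 0);	// wait-all semantics, no initial reservations
	waitAllSem.reserve();					// one reservation per pending operation
	waitAllSem.reserve();
	waitAllSem.release();					// decrements the counter; one reservation still outstanding
	waitAllSem.release();					// counter reaches zero; waiting threads are unblocked
	waitAllSem.wait(0, false);				// a zero timeout simply polls; returns true because the semaphore is clear
}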

#pragma mark -
#pragma mark MVKSemaphore

bool MVKSemaphore::wait(uint64_t timeout) {
bool isDone = _blocker.wait(timeout, true);
if ( !isDone && timeout > 0 ) { reportError(VK_TIMEOUT, "Vulkan semaphore timeout after %llu nanoseconds.", timeout); }
return isDone;
}
void MVKSemaphore::signal() {
_blocker.release();
}
void MVKSemaphore::encodeWait(id<MTLCommandBuffer> cmdBuff) {
[cmdBuff encodeWaitForEvent: _mtlEvent value: _mtlEventValue];
++_mtlEventValue;
}
void MVKSemaphore::encodeSignal(id<MTLCommandBuffer> cmdBuff) {
[cmdBuff encodeSignalEvent: _mtlEvent value: _mtlEventValue];
}
MVKSemaphore::MVKSemaphore(MVKDevice* device, const VkSemaphoreCreateInfo* pCreateInfo)
: MVKVulkanAPIDeviceObject(device), _blocker(false, 1), _mtlEvent(nil), _mtlEventValue(1) {
if (device->_pMetalFeatures->events) {
_mtlEvent = [device->getMTLDevice() newEvent];
}
}
MVKSemaphore::~MVKSemaphore() {
[_mtlEvent release];
}
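// Illustrative sketch (not part of MoltenVK): how a queue submission would typically pair
// encodeSignal() and encodeWait() so that GPU work in one command buffer waits for GPU work
// in another. encodeSignal() encodes a signal of the MTLEvent at the current value, and
// encodeWait() encodes a wait on that same value and then advances it for the next pair.
// The command buffers are assumed to exist already; function and parameter names are hypothetical.
static inline void exampleEncodeSemaphorePair(MVKSemaphore* sem4,
											  id<MTLCommandBuffer> signalingCmdBuff,
											  id<MTLCommandBuffer> waitingCmdBuff) {
	sem4->encodeSignal(signalingCmdBuff);	// the producer command buffer signals the event
	sem4->encodeWait(waitingCmdBuff);		// the consumer command buffer stalls until the event reaches that value
}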

#pragma mark -
#pragma mark MVKFence

void MVKFence::addSitter(MVKFenceSitter* fenceSitter) {
lock_guard<mutex> lock(_lock);
// Only unsignaled fences are of interest. If this fence is already signaled,
// don't register it with the sitter, and don't notify the sitter.
if (_isSignaled) { return; }
// Ensure each fence only added once to each fence sitter
auto addRslt = _fenceSitters.insert(fenceSitter); // pair whose second element is true if the sitter was newly added
if (addRslt.second) { fenceSitter->awaitFence(this); }
}
void MVKFence::removeSitter(MVKFenceSitter* fenceSitter) {
lock_guard<mutex> lock(_lock);
_fenceSitters.erase(fenceSitter);
}
void MVKFence::signal() {
lock_guard<mutex> lock(_lock);
if (_isSignaled) { return; } // Only signal once
_isSignaled = true;
// Notify all the fence sitters, and clear them from this instance.
for (auto& fs : _fenceSitters) {
fs->fenceSignaled(this);
}
_fenceSitters.clear();
}
void MVKFence::reset() {
lock_guard<mutex> lock(_lock);
_isSignaled = false;
_fenceSitters.clear();
}
bool MVKFence::getIsSignaled() {
lock_guard<mutex> lock(_lock);
return _isSignaled;
}
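// Illustrative sketch (not part of MoltenVK): the fence/sitter interaction documented in
// addSitter() above, reduced to a single fence. If the fence is already signaled, addSitter()
// does nothing and the wait returns immediately; otherwise signal() unblocks the sitter.
// This mirrors mvkWaitForFences() below; function and variable names are hypothetical.
static inline bool exampleWaitOnFence(MVKFence* fence, uint64_t timeout) {
	MVKFenceSitter sitter(true);			// wait-all semantics; irrelevant for a single fence
	fence->addSitter(&sitter);				// registers the sitter only if the fence is unsignaled
	bool signaled = sitter.wait(timeout);	// blocks until fenceSignaled() is called, or times out
	fence->removeSitter(&sitter);			// always detach before the sitter goes out of scope
	return signaled;
}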

#pragma mark -
#pragma mark Support functions

VkResult mvkResetFences(uint32_t fenceCount, const VkFence* pFences) {
for (uint32_t i = 0; i < fenceCount; i++) {
((MVKFence*)pFences[i])->reset();
}
return VK_SUCCESS;
}
// Create a blocking fence sitter, add it to each fence, wait, then remove it.
VkResult mvkWaitForFences(MVKDevice* device,
uint32_t fenceCount,
const VkFence* pFences,
VkBool32 waitAll,
uint64_t timeout) {
VkResult rslt = VK_SUCCESS;
MVKFenceSitter fenceSitter(waitAll);
for (uint32_t i = 0; i < fenceCount; i++) {
((MVKFence*)pFences[i])->addSitter(&fenceSitter);
}
if ( !fenceSitter.wait(timeout) ) {
rslt = VK_TIMEOUT;
if (timeout > 0) {
device->reportError(rslt, "Vulkan fence timeout after %llu nanoseconds.", timeout);
}
}
for (uint32_t i = 0; i < fenceCount; i++) {
((MVKFence*)pFences[i])->removeSitter(&fenceSitter);
}
return rslt;
}
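// Illustrative sketch (not part of MoltenVK's API surface): waiting until any one of several
// fences signals by passing waitAll = VK_FALSE, mirroring the vkWaitForFences() semantics that
// mvkWaitForFences() implements. The fence handles and timeout value are hypothetical.
static inline VkResult exampleWaitForAnyFence(MVKDevice* device, VkFence fence0, VkFence fence1) {
	VkFence fences[] = { fence0, fence1 };
	return mvkWaitForFences(device, 2, fences, VK_FALSE, 100000000);	// 100 ms timeout, in nanoseconds
}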

#pragma mark -
#pragma mark MVKMetalCompiler

// Create a compiled object by dispatching the block to the default global dispatch queue, and waiting only as long
// as the MVKConfiguration::metalCompileTimeout value. If the timeout is triggered, a Vulkan error is created.
// This approach limits the lengthy time (30+ seconds!) consumed by Metal when its internal compiler fails.
// The thread dispatch is needed because even the synchronous portion of the asynchronous Metal compilation methods
// can take well over a second to return when a compiler failure occurs! A sketch of the expected calling pattern
// appears after markDestroyed() below.
void MVKMetalCompiler::compile(unique_lock<mutex>& lock, dispatch_block_t block) {
MVKAssert( _startTime == 0, "%s compile occurred already in this instance. Instances of %s should only be used for a single compile activity.", _compilerType.c_str(), getClassName().c_str());
MVKDevice* mvkDev = _owner->getDevice();
_startTime = mvkDev->getPerformanceTimestamp();
dispatch_async(dispatch_get_global_queue(DISPATCH_QUEUE_PRIORITY_DEFAULT, 0), block);
// Limit timeout to avoid overflow since wait_for() uses wait_until()
chrono::nanoseconds nanoTimeout(min(mvkDev->_pMVKConfig->metalCompileTimeout, kMVKUndefinedLargeUInt64));
_blocker.wait_for(lock, nanoTimeout, [this]{ return _isCompileDone; });
if ( !_isCompileDone ) {
NSString* errDesc = [NSString stringWithFormat: @"Timeout after %.3f milliseconds. Likely internal Metal compiler error", (double)nanoTimeout.count() / 1e6];
_compileError = [[NSError alloc] initWithDomain: @"MoltenVK" code: 1 userInfo: @{NSLocalizedDescriptionKey : errDesc}]; // retained
}
if (_compileError) { handleError(); }
mvkDev->addActivityPerformance(*_pPerformanceTracker, _startTime);
}
void MVKMetalCompiler::handleError() {
_owner->setConfigurationResult(reportError(VK_ERROR_INITIALIZATION_FAILED,
"%s compile failed (Error code %li):\n%s.",
_compilerType.c_str(), (long)_compileError.code,
_compileError.localizedDescription.UTF8String));
}
// Returns whether the compilation came in late, after the compiler was destroyed.
bool MVKMetalCompiler::endCompile(NSError* compileError) {
_compileError = [compileError retain]; // retained
_isCompileDone = true;
_blocker.notify_all();
return _isDestroyed;
}
void MVKMetalCompiler::destroy() {
if (markDestroyed()) { MVKBaseObject::destroy(); }
}
// Marks this object as destroyed, and returns whether the compilation is complete.
bool MVKMetalCompiler::markDestroyed() {
lock_guard<mutex> lock(_completionLock);
_isDestroyed = true;
return _isCompileDone;
}
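// Illustrative sketch (hypothetical, not part of MoltenVK): the calling pattern a concrete
// compiler subclass is expected to follow. Only compile(), endCompile(), destroy(), and
// _completionLock come from this file; the subclass, its other members, and the Metal API call
// are assumptions. If endCompile() reports that destroy() was already called while the compile
// was still in flight, the completion handler finishes the deferred destruction by calling
// destroy() again.
//
//	void MVKExampleLibraryCompiler::compileLibrary(NSString* mslSource) {
//		unique_lock<mutex> lock(_completionLock);
//		compile(lock, ^{
//			[_mtlDevice newLibraryWithSource: mslSource
//									 options: nil
//						   completionHandler: ^(id<MTLLibrary> mtlLib, NSError* error) {
//							   bool isLate;
//							   {
//								   lock_guard<mutex> cmpLock(_completionLock);
//								   _mtlLibrary = [mtlLib retain];
//								   isLate = endCompile(error);
//							   }
//							   if (isLate) { destroy(); }	// compile arrived after destroy()
//						   }];
//		});
//	}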

#pragma mark Construction

MVKMetalCompiler::~MVKMetalCompiler() {
[_compileError release];
}