1
0
mirror of https://github.com/doitsujin/dxvk.git synced 2024-12-02 10:24:12 +01:00

[dxvk] Implemented staging buffers for large data transfers

This commit is contained in:
Philip Rebohle 2017-12-10 15:57:51 +01:00
parent 89ec199c34
commit 52f1c4fa00
17 changed files with 428 additions and 25 deletions

View File

@ -1169,8 +1169,21 @@ namespace dxvk {
subresources.layerCount = image->info().numLayers;
m_resourceInitContext->initImage(image, subresources);
if (pInitialData != nullptr)
Logger::err("D3D11: InitTexture cannot upload image data yet");
if (pInitialData != nullptr) {
VkImageSubresourceLayers subresourceLayers;
subresourceLayers.aspectMask = subresources.aspectMask;
subresourceLayers.mipLevel = 0;
subresourceLayers.baseArrayLayer = 0;
subresourceLayers.layerCount = subresources.layerCount;
m_resourceInitContext->updateImage(
image, subresourceLayers,
VkOffset3D { 0, 0, 0 },
image->info().extent,
pInitialData->pSysMem,
pInitialData->SysMemPitch,
pInitialData->SysMemSlicePitch);
}
m_dxvkDevice->submitCommandList(
m_resourceInitContext->endRecording(),

View File

@ -22,7 +22,7 @@ namespace dxvk {
// Create swap chain for the surface
DxvkSwapchainProperties swapchainProperties;
swapchainProperties.preferredSurfaceFormat = this->pickFormat(bufferFormat);
swapchainProperties.preferredPresentMode = VK_PRESENT_MODE_IMMEDIATE_KHR;
swapchainProperties.preferredPresentMode = VK_PRESENT_MODE_FIFO_KHR;
swapchainProperties.preferredBufferSize.width = bufferWidth;
swapchainProperties.preferredBufferSize.height = bufferHeight;
@ -206,7 +206,7 @@ namespace dxvk {
DXGI_FORMAT bufferFormat) {
DxvkSwapchainProperties swapchainProperties;
swapchainProperties.preferredSurfaceFormat = this->pickFormat(bufferFormat);
swapchainProperties.preferredPresentMode = VK_PRESENT_MODE_IMMEDIATE_KHR;
swapchainProperties.preferredPresentMode = VK_PRESENT_MODE_FIFO_KHR;
swapchainProperties.preferredBufferSize.width = bufferWidth;
swapchainProperties.preferredBufferSize.height = bufferHeight;

View File

@ -47,11 +47,11 @@ namespace dxvk {
/**
* \brief DXVK buffer
* \brief Buffer resource
*
* A simple buffer resource that stores
* linear data. Can be mapped to host
* memory.
* A simple buffer resource that stores linear,
* unformatted data. Can be accessed by the host
* if allocated on an appropriate memory type.
*/
class DxvkBuffer : public DxvkResource {
@ -86,10 +86,11 @@ namespace dxvk {
* If the buffer has been created on a host-visible
* memory type, the buffer memory is mapped and can
* be accessed by the host.
* \param [in] offset Byte offset into mapped region
* \returns Pointer to mapped memory region
*/
void* mapPtr() const {
return m_memory.mapPtr();
void* mapPtr(VkDeviceSize offset) const {
return m_memory.mapPtr(offset);
}
private:

View File

@ -4,8 +4,9 @@ namespace dxvk {
DxvkCommandList::DxvkCommandList(
const Rc<vk::DeviceFn>& vkd,
DxvkDevice* device,
uint32_t queueFamily)
: m_vkd(vkd), m_descAlloc(vkd) {
: m_vkd(vkd), m_descAlloc(vkd), m_stagingAlloc(device) {
VkCommandPoolCreateInfo poolInfo;
poolInfo.sType = VK_STRUCTURE_TYPE_COMMAND_POOL_CREATE_INFO;
poolInfo.pNext = nullptr;
@ -28,7 +29,7 @@ namespace dxvk {
DxvkCommandList::~DxvkCommandList() {
m_resources.reset();
this->reset();
m_vkd->vkDestroyCommandPool(
m_vkd->device(), m_pool, nullptr);
@ -86,6 +87,7 @@ namespace dxvk {
void DxvkCommandList::reset() {
m_stagingAlloc.reset();
m_descAlloc.reset();
m_resources.reset();
}
@ -299,4 +301,35 @@ namespace dxvk {
firstViewport, viewportCount, viewports);
}
DxvkStagingBufferSlice DxvkCommandList::stagedAlloc(VkDeviceSize size) {
return m_stagingAlloc.alloc(size);
}
void DxvkCommandList::stagedBufferCopy(
VkBuffer dstBuffer,
VkDeviceSize dstOffset,
VkDeviceSize dataSize,
const DxvkStagingBufferSlice& dataSlice) {
VkBufferCopy region;
region.srcOffset = dataSlice.offset;
region.dstOffset = dstOffset;
region.size = dataSize;
m_vkd->vkCmdCopyBuffer(m_buffer,
dataSlice.buffer, dstBuffer, 1, &region);
}
void DxvkCommandList::stagedBufferImageCopy(
VkImage dstImage,
VkImageLayout dstImageLayout,
const VkBufferImageCopy& dstImageRegion,
const DxvkStagingBufferSlice& dataSlice) {
m_vkd->vkCmdCopyBufferToImage(m_buffer,
dataSlice.buffer, dstImage, dstImageLayout,
1, &dstImageRegion);
}
}

View File

@ -5,6 +5,7 @@
#include "dxvk_descriptor.h"
#include "dxvk_lifetime.h"
#include "dxvk_pipelayout.h"
#include "dxvk_staging.h"
namespace dxvk {
@ -23,6 +24,7 @@ namespace dxvk {
DxvkCommandList(
const Rc<vk::DeviceFn>& vkd,
DxvkDevice* device,
uint32_t queueFamily);
~DxvkCommandList();
@ -177,6 +179,21 @@ namespace dxvk {
uint32_t viewportCount,
const VkViewport* viewports);
DxvkStagingBufferSlice stagedAlloc(
VkDeviceSize size);
void stagedBufferCopy(
VkBuffer dstBuffer,
VkDeviceSize dstOffset,
VkDeviceSize dataSize,
const DxvkStagingBufferSlice& dataSlice);
void stagedBufferImageCopy(
VkImage dstImage,
VkImageLayout dstImageLayout,
const VkBufferImageCopy& dstImageRegion,
const DxvkStagingBufferSlice& dataSlice);
private:
Rc<vk::DeviceFn> m_vkd;
@ -186,8 +203,7 @@ namespace dxvk {
DxvkLifetimeTracker m_resources;
DxvkDescriptorAlloc m_descAlloc;
std::vector<VkWriteDescriptorSet> m_descriptorSetWrites;
DxvkStagingAlloc m_stagingAlloc;
};

View File

@ -1,3 +1,5 @@
#include <cstring>
#include "dxvk_device.h"
#include "dxvk_context.h"
#include "dxvk_main.h"
@ -374,16 +376,23 @@ namespace dxvk {
this->renderPassEnd();
if (size == VK_WHOLE_SIZE)
size = buffer->info().size;
size = buffer->info().size - offset;
if (size != 0) {
// Vulkan specifies that small amounts of data (up to 64kB)
// can be copied to a buffer directly. Anything larger than
// that must be copied through a staging buffer.
if (size <= 65536) {
m_cmd->cmdUpdateBuffer(
buffer->handle(),
offset, size, data);
} else {
// TODO implement
Logger::err("DxvkContext::updateBuffer: Large updates not yet supported");
auto slice = m_cmd->stagedAlloc(size);
std::memcpy(slice.mapPtr, data, size);
m_cmd->stagedBufferCopy(
buffer->handle(),
offset, size, slice);
}
m_barriers.accessBuffer(
@ -393,10 +402,103 @@ namespace dxvk {
buffer->info().stages,
buffer->info().access);
m_barriers.recordCommands(m_cmd);
m_cmd->trackResource(buffer);
}
}
void DxvkContext::updateImage(
const Rc<DxvkImage>& image,
const VkImageSubresourceLayers& subresources,
VkOffset3D imageOffset,
VkExtent3D imageExtent,
const void* data,
VkDeviceSize pitchPerRow,
VkDeviceSize pitchPerLayer) {
if (subresources.layerCount == 0) {
Logger::warn("DxvkContext::updateImage: Layer count is zero");
return;
}
VkImageSubresourceRange subresourceRange;
subresourceRange.aspectMask = subresources.aspectMask;
subresourceRange.baseMipLevel = subresources.mipLevel;
subresourceRange.levelCount = 1;
subresourceRange.baseArrayLayer = subresources.baseArrayLayer;
subresourceRange.layerCount = subresources.layerCount;
m_barriers.accessImage(
image, subresourceRange,
image->info().extent == imageExtent
? VK_IMAGE_LAYOUT_UNDEFINED
: image->info().layout,
image->info().stages,
image->info().access,
VK_IMAGE_LAYOUT_TRANSFER_DST_OPTIMAL,
VK_PIPELINE_STAGE_TRANSFER_BIT,
VK_ACCESS_TRANSFER_WRITE_BIT);
m_barriers.recordCommands(m_cmd);
// TODO support block formats properly
const DxvkFormatInfo* formatInfo
= imageFormatInfo(image->info().format);
const VkDeviceSize layerCount = imageExtent.depth * subresources.layerCount;
VkDeviceSize bytesPerRow = imageExtent.width * formatInfo->elementSize;
VkDeviceSize bytesPerLayer = imageExtent.height * bytesPerRow;
VkDeviceSize bytesTotal = layerCount * bytesPerLayer;
auto slice = m_cmd->stagedAlloc(bytesTotal);
auto dstData = reinterpret_cast<char*>(slice.mapPtr);
auto srcData = reinterpret_cast<const char*>(data);
bool useDirectCopy = true;
useDirectCopy &= (pitchPerLayer == bytesPerLayer) || layerCount == 1;
useDirectCopy &= (pitchPerRow == bytesPerRow) || imageExtent.height == 1;
if (useDirectCopy) {
std::memcpy(dstData, srcData, bytesTotal);
} else {
for (uint32_t i = 0; i < layerCount; i++) {
for (uint32_t j = 0; j < imageExtent.height; j++) {
std::memcpy(dstData, srcData, bytesPerRow);
dstData += bytesPerRow;
srcData += pitchPerRow;
}
dstData += bytesPerLayer;
srcData += pitchPerLayer;
}
}
VkBufferImageCopy region;
region.bufferOffset = slice.offset;
region.bufferRowLength = 0;
region.bufferImageHeight = 0;
region.imageSubresource = subresources;
region.imageOffset = imageOffset;
region.imageExtent = imageExtent;
m_cmd->stagedBufferImageCopy(image->handle(),
VK_IMAGE_LAYOUT_TRANSFER_DST_OPTIMAL,
region, slice);
m_barriers.accessImage(
image, subresourceRange,
VK_IMAGE_LAYOUT_TRANSFER_DST_OPTIMAL,
VK_PIPELINE_STAGE_TRANSFER_BIT,
VK_ACCESS_TRANSFER_WRITE_BIT,
image->info().layout,
image->info().stages,
image->info().access);
m_barriers.recordCommands(m_cmd);
m_cmd->trackResource(image);
}
void DxvkContext::setViewports(
uint32_t viewportCount,
const VkViewport* viewports,

View File

@ -262,6 +262,27 @@ namespace dxvk {
VkDeviceSize size,
const void* data);
/**
* \brief Updates an image
*
* Copies data from the host into an image.
* \param [in] image Destination image
* \param [in] subsresources Image subresources to update
* \param [in] imageOffset Offset of the image area to update
* \param [in] imageExtent Size of the image area to update
* \param [in] data Source data
* \param [in] pitchPerRow Row pitch of the source data
* \param [in] pitchPerLayer Layer pitch of the source data
*/
void updateImage(
const Rc<DxvkImage>& image,
const VkImageSubresourceLayers& subresources,
VkOffset3D imageOffset,
VkExtent3D imageExtent,
const void* data,
VkDeviceSize pitchPerRow,
VkDeviceSize pitchPerLayer);
/**
* \brief Sets viewports
*

View File

@ -32,8 +32,34 @@ namespace dxvk {
}
Rc<DxvkStagingBuffer> DxvkDevice::allocStagingBuffer(VkDeviceSize size) {
// TODO actually recycle old buffers
const VkDeviceSize baseSize = 64 * 1024 * 1024;
const VkDeviceSize bufferSize = std::max(baseSize, size);
DxvkBufferCreateInfo info;
info.size = bufferSize;
info.usage = VK_BUFFER_USAGE_TRANSFER_SRC_BIT;
info.stages = VK_PIPELINE_STAGE_TRANSFER_BIT
| VK_PIPELINE_STAGE_HOST_BIT;
info.access = VK_ACCESS_TRANSFER_READ_BIT
| VK_ACCESS_HOST_WRITE_BIT;
VkMemoryPropertyFlags memFlags
= VK_MEMORY_PROPERTY_HOST_VISIBLE_BIT
| VK_MEMORY_PROPERTY_HOST_COHERENT_BIT;
return new DxvkStagingBuffer(this->createBuffer(info, memFlags));
}
void DxvkDevice::recycleStagingBuffer(const Rc<DxvkStagingBuffer>& buffer) {
// TODO implement
}
Rc<DxvkCommandList> DxvkDevice::createCommandList() {
return new DxvkCommandList(m_vkd,
return new DxvkCommandList(m_vkd, this,
m_adapter->graphicsQueueFamily());
}

View File

@ -73,6 +73,29 @@ namespace dxvk {
return m_features;
}
/**
* \brief Allocates a staging buffer
*
* Returns a staging buffer that is at least as large
* as the requested size. It is usually bigger so that
* a single staging buffer may serve multiple allocations.
* \param [in] size Minimum buffer size
* \returns The staging buffer
*/
Rc<DxvkStagingBuffer> allocStagingBuffer(
VkDeviceSize size);
/**
* \brief Recycles a staging buffer
*
* When a staging buffer is no longer needed, it should
* be returned to the device so that it can be reused
* for subsequent allocations.
* \param [in] buffer The buffer
*/
void recycleStagingBuffer(
const Rc<DxvkStagingBuffer>& buffer);
/**
* \brief Creates a command list
* \returns The command list

View File

@ -12,7 +12,7 @@ namespace dxvk {
*/
struct DxvkFormatInfo {
/// Size of an element in this format
uint32_t byteSize;
VkDeviceSize elementSize;
/// Available image aspect flags
VkImageAspectFlags aspectMask;

View File

@ -78,8 +78,8 @@ namespace dxvk {
* \brief DXVK image
*
* An image resource consisting of various subresources.
* Cannot be mapped to host memory, the only way to access
* image data is through buffer transfer operations.
* Can be accessed by the host if allocated on a suitable
* memory type and if created with the linear tiling option.
*/
class DxvkImage : public DxvkResource {

View File

@ -47,10 +47,12 @@ namespace dxvk {
/**
* \brief Pointer to mapped data
*
* \param [in] offset Byte offset
* \returns Pointer to mapped data
*/
void* mapPtr() const {
return m_mapPtr;
void* mapPtr(VkDeviceSize offset) const {
return reinterpret_cast<char*>(m_mapPtr) + offset;
}
private:

85
src/dxvk/dxvk_staging.cpp Normal file
View File

@ -0,0 +1,85 @@
#include "dxvk_device.h"
#include "dxvk_staging.h"
namespace dxvk {
DxvkStagingBuffer::DxvkStagingBuffer(
const Rc<DxvkBuffer>& buffer)
: m_buffer(buffer), m_bufferSize(buffer->info().size){
}
DxvkStagingBuffer::~DxvkStagingBuffer() {
}
VkDeviceSize DxvkStagingBuffer::freeBytes() const {
return m_bufferSize - m_bufferOffset;
}
bool DxvkStagingBuffer::alloc(
VkDeviceSize size,
DxvkStagingBufferSlice& slice) {
if (m_bufferOffset + size > m_bufferSize)
return false;
slice.buffer = m_buffer->handle();
slice.offset = m_bufferOffset;
slice.mapPtr = m_buffer->mapPtr(m_bufferOffset);
m_bufferOffset += size;
return true;
}
void DxvkStagingBuffer::reset() {
m_bufferOffset = 0;
}
DxvkStagingAlloc::DxvkStagingAlloc(DxvkDevice* device)
: m_device(device) { }
DxvkStagingAlloc::~DxvkStagingAlloc() {
this->reset();
}
DxvkStagingBufferSlice DxvkStagingAlloc::alloc(VkDeviceSize size) {
Rc<DxvkStagingBuffer> selectedBuffer;
// Try a worst-fit allocation strategy on the existing staging
// buffers first. This should keep the amount of wasted space
// small, especially if there are large allocations.
for (const auto& buf : m_stagingBuffers) {
if (selectedBuffer == nullptr || (buf->freeBytes() > selectedBuffer->freeBytes()))
selectedBuffer = buf;
}
// If we have no suitable buffer, allocate one from the device
// that is *at least* as large as the amount of data we need
// to upload. Usually it will be bigger.
DxvkStagingBufferSlice slice;
if ((selectedBuffer == nullptr) || (!selectedBuffer->alloc(size, slice))) {
selectedBuffer = m_device->allocStagingBuffer(size);
selectedBuffer->alloc(size, slice);
m_stagingBuffers.push_back(selectedBuffer);
}
return slice;
}
void DxvkStagingAlloc::reset() {
for (const auto& buf : m_stagingBuffers)
m_device->recycleStagingBuffer(buf);
m_stagingBuffers.resize(0);
}
}

63
src/dxvk/dxvk_staging.h Normal file
View File

@ -0,0 +1,63 @@
#pragma once
#include "dxvk_buffer.h"
namespace dxvk {
class DxvkDevice;
struct DxvkStagingBufferSlice {
VkBuffer buffer = VK_NULL_HANDLE;
VkDeviceSize offset = 0;
void* mapPtr = nullptr;
};
class DxvkStagingBuffer : public RcObject {
public:
DxvkStagingBuffer(
const Rc<DxvkBuffer>& buffer);
~DxvkStagingBuffer();
VkDeviceSize freeBytes() const;
bool alloc(
VkDeviceSize size,
DxvkStagingBufferSlice& slice);
void reset();
private:
Rc<DxvkBuffer> m_buffer;
VkDeviceSize m_bufferSize = 0;
VkDeviceSize m_bufferOffset = 0;
};
class DxvkStagingAlloc {
public:
DxvkStagingAlloc(DxvkDevice* device);
~DxvkStagingAlloc();
DxvkStagingBufferSlice alloc(
VkDeviceSize size);
void reset();
private:
DxvkDevice* const m_device;
std::vector<Rc<DxvkStagingBuffer>> m_stagingBuffers;
};
}

View File

@ -20,4 +20,17 @@ namespace dxvk::util {
return result;
}
}
}
bool operator == (VkExtent3D a, VkExtent3D b) {
return a.width == b.width
&& a.height == b.height
&& a.depth == b.depth;
}
bool operator != (VkExtent3D a, VkExtent3D b) {
return a.width != b.width
|| a.height != b.height
|| a.depth != b.depth;
}

View File

@ -13,4 +13,8 @@ namespace dxvk::util {
VkPipelineStageFlags pipelineStages(
VkShaderStageFlags shaderStages);
}
}
bool operator == (VkExtent3D a, VkExtent3D b);
bool operator != (VkExtent3D a, VkExtent3D b);

View File

@ -22,6 +22,7 @@ dxvk_src = files([
'dxvk_resource.cpp',
'dxvk_sampler.cpp',
'dxvk_shader.cpp',
'dxvk_staging.cpp',
'dxvk_surface.cpp',
'dxvk_swapchain.cpp',
'dxvk_sync.cpp',