mirror of
https://github.com/doitsujin/dxvk.git
synced 2025-03-06 20:58:37 +01:00
[d3d11] Embed UpdateBuffer data in CS chunk
Tiny optimization that gets rid of a copy and also lets us use chunk memory more efficiently.
This commit is contained in:
parent
5b68884fd9
commit
416f9c5a4a
1 changed files with 13 additions and 7 deletions
|
@ -5507,19 +5507,25 @@ namespace dxvk {
|
|||
if (Length <= MaxDirectUpdateSize && !((Offset | Length) & 0x3)) {
|
||||
// The backend has special code paths for small buffer updates,
|
||||
// however both offset and size must be aligned to four bytes.
|
||||
std::array<char, MaxDirectUpdateSize> data;
|
||||
std::memcpy(data.data(), pSrcData, Length);
|
||||
// Write the data directly to the CS chunk.
|
||||
uint32_t dwordCount = Length / sizeof(uint32_t);
|
||||
|
||||
EmitCs([
|
||||
cBufferData = data,
|
||||
EmitCsCmd<uint32_t>(D3D11CmdType::None, dwordCount, [
|
||||
cBufferSlice = std::move(bufferSlice)
|
||||
] (DxvkContext* ctx) {
|
||||
] (DxvkContext* ctx, const uint32_t* data, size_t) {
|
||||
ctx->updateBuffer(
|
||||
cBufferSlice.buffer(),
|
||||
cBufferSlice.offset(),
|
||||
cBufferSlice.length(),
|
||||
cBufferData.data());
|
||||
cBufferSlice.length(), data);
|
||||
});
|
||||
|
||||
// Compiler should be able to vectorize here, but GCC only does
|
||||
// if we cast the destination pointer to the correct type first
|
||||
auto src = reinterpret_cast<const uint32_t*>(pSrcData);
|
||||
auto dst = reinterpret_cast<uint32_t*>(m_csData->first());
|
||||
|
||||
for (uint32_t i = 0; i < dwordCount; i++)
|
||||
new (dst + i) uint32_t(src[i]);
|
||||
} else {
|
||||
// Write directly to a staging buffer and dispatch a copy
|
||||
DxvkBufferSlice stagingSlice = AllocStagingBuffer(Length);
|
||||
|
|
Loading…
Add table
Reference in a new issue