diff options
author | V3n3RiX <venerix@redcorelinux.org> | 2019-10-13 22:19:36 +0100 |
---|---|---|
committer | V3n3RiX <venerix@redcorelinux.org> | 2019-10-14 23:22:23 +0100 |
commit | 4b19be30aa626b327c885dae62c559ec0e9fb935 (patch) | |
tree | 76e74807bc479502e13866b581b6bf86734ec634 /dev-libs/rocr-runtime/files | |
parent | 30d6f67c98d149508509d5e86f176d558793acc0 (diff) |
gentoo resync : 13.10.2019
Diffstat (limited to 'dev-libs/rocr-runtime/files')
-rw-r--r-- | dev-libs/rocr-runtime/files/rocr-runtime-2.8.0-fix_doorbell_map.patch | 57 |
1 files changed, 57 insertions, 0 deletions
diff --git a/dev-libs/rocr-runtime/files/rocr-runtime-2.8.0-fix_doorbell_map.patch b/dev-libs/rocr-runtime/files/rocr-runtime-2.8.0-fix_doorbell_map.patch new file mode 100644 index 000000000000..aef3d297034e --- /dev/null +++ b/dev-libs/rocr-runtime/files/rocr-runtime-2.8.0-fix_doorbell_map.patch @@ -0,0 +1,57 @@ +https://github.com/RadeonOpenCompute/ROCR-Runtime/pull/71 + +From d2a6ad97eb96a28d8f8b658b26ab94e911886cf2 Mon Sep 17 00:00:00 2001 +From: Sean Keely <Sean.Keely@amd.com> +Date: Thu, 5 Sep 2019 20:58:57 -0500 +Subject: [PATCH] Correct doorbell_queue_map allocation. + +doorbell_queue_map should be allocated unconditionally. +--- + core/runtime/amd_gpu_agent.cpp | 22 +++++++++++----------- + 1 file changed, 11 insertions(+), 11 deletions(-) + +diff --git a/core/runtime/amd_gpu_agent.cpp b/core/runtime/amd_gpu_agent.cpp +index 9b79a6b..76df913 100644 +--- a/core/runtime/amd_gpu_agent.cpp ++++ b/core/runtime/amd_gpu_agent.cpp +@@ -1182,12 +1182,22 @@ void GpuAgent::SyncClocks() { + } + + void GpuAgent::BindTrapHandler() { ++ // Make an empty map from doorbell index to queue. ++ // The trap handler uses this to retrieve a wave's amd_queue_t*. ++ auto doorbell_queue_map_size = MAX_NUM_DOORBELLS * sizeof(amd_queue_t*); ++ ++ doorbell_queue_map_ = (amd_queue_t**)core::Runtime::runtime_singleton_->system_allocator()( ++ doorbell_queue_map_size, 0x1000, 0); ++ assert(doorbell_queue_map_ != NULL && "Doorbell queue map allocation failed"); ++ ++ memset(doorbell_queue_map_, 0, doorbell_queue_map_size); ++ + if (isa_->GetMajorVersion() == 7) { + // No trap handler support on Gfx7, soft error. + return; + } + +- // Disable trap handler on Carrizo until KFD is fixed. ++ // Disable trap handler on APUs until KFD is fixed. + if (profile_ == HSA_PROFILE_FULL) { + return; + } +@@ -1195,16 +1205,6 @@ void GpuAgent::BindTrapHandler() { + // Assemble the trap handler source code. + AssembleShader("TrapHandler", AssembleTarget::ISA, trap_code_buf_, trap_code_buf_size_); + +- // Make an empty map from doorbell index to queue. +- // The trap handler uses this to retrieve a wave's amd_queue_t*. +- auto doorbell_queue_map_size = MAX_NUM_DOORBELLS * sizeof(amd_queue_t*); +- +- doorbell_queue_map_ = (amd_queue_t**)core::Runtime::runtime_singleton_->system_allocator()( +- doorbell_queue_map_size, 0x1000, 0); +- assert(doorbell_queue_map_ != NULL && "Doorbell queue map allocation failed"); +- +- memset(doorbell_queue_map_, 0, doorbell_queue_map_size); +- + // Bind the trap handler to this node. + HSAKMT_STATUS err = hsaKmtSetTrapHandler(node_id(), trap_code_buf_, trap_code_buf_size_, + doorbell_queue_map_, doorbell_queue_map_size); |