| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477 |
- // Copyright (c) 2017 The Khronos Group Inc.
- // Copyright (c) 2017 Valve Corporation
- // Copyright (c) 2017 LunarG Inc.
- // Modifications Copyright (C) 2024 Advanced Micro Devices, Inc. All rights
- // reserved.
- //
- // Licensed under the Apache License, Version 2.0 (the "License");
- // you may not use this file except in compliance with the License.
- // You may obtain a copy of the License at
- //
- // http://www.apache.org/licenses/LICENSE-2.0
- //
- // Unless required by applicable law or agreed to in writing, software
- // distributed under the License is distributed on an "AS IS" BASIS,
- // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- // See the License for the specific language governing permissions and
- // limitations under the License.
- #include "source/opt/local_access_chain_convert_pass.h"
- #include "ir_context.h"
- #include "iterator.h"
- #include "source/util/string_utils.h"
- namespace spvtools {
- namespace opt {
- namespace {
- constexpr uint32_t kStoreValIdInIdx = 1;
- constexpr uint32_t kAccessChainPtrIdInIdx = 0;
- } // namespace
- void LocalAccessChainConvertPass::BuildAndAppendInst(
- spv::Op opcode, uint32_t typeId, uint32_t resultId,
- const std::vector<Operand>& in_opnds,
- std::vector<std::unique_ptr<Instruction>>* newInsts) {
- std::unique_ptr<Instruction> newInst(
- new Instruction(context(), opcode, typeId, resultId, in_opnds));
- get_def_use_mgr()->AnalyzeInstDefUse(&*newInst);
- newInsts->emplace_back(std::move(newInst));
- }
- uint32_t LocalAccessChainConvertPass::BuildAndAppendVarLoad(
- const Instruction* ptrInst, uint32_t* varId, uint32_t* varPteTypeId,
- std::vector<std::unique_ptr<Instruction>>* newInsts) {
- const uint32_t ldResultId = TakeNextId();
- if (ldResultId == 0) {
- return 0;
- }
- *varId = ptrInst->GetSingleWordInOperand(kAccessChainPtrIdInIdx);
- const Instruction* varInst = get_def_use_mgr()->GetDef(*varId);
- assert(varInst->opcode() == spv::Op::OpVariable);
- *varPteTypeId = GetPointeeTypeId(varInst);
- BuildAndAppendInst(spv::Op::OpLoad, *varPteTypeId, ldResultId,
- {{spv_operand_type_t::SPV_OPERAND_TYPE_ID, {*varId}}},
- newInsts);
- return ldResultId;
- }
- void LocalAccessChainConvertPass::AppendConstantOperands(
- const Instruction* ptrInst, std::vector<Operand>* in_opnds) {
- uint32_t iidIdx = 0;
- ptrInst->ForEachInId([&iidIdx, &in_opnds, this](const uint32_t* iid) {
- if (iidIdx > 0) {
- const Instruction* cInst = get_def_use_mgr()->GetDef(*iid);
- const auto* constant_value =
- context()->get_constant_mgr()->GetConstantFromInst(cInst);
- assert(constant_value != nullptr &&
- "Expecting the index to be a constant.");
- // We take the sign extended value because OpAccessChain interprets the
- // index as signed.
- int64_t long_value = constant_value->GetSignExtendedValue();
- assert(long_value <= UINT32_MAX && long_value >= 0 &&
- "The index value is too large for a composite insert or extract "
- "instruction.");
- uint32_t val = static_cast<uint32_t>(long_value);
- in_opnds->push_back(
- {spv_operand_type_t::SPV_OPERAND_TYPE_LITERAL_INTEGER, {val}});
- }
- ++iidIdx;
- });
- }
- bool LocalAccessChainConvertPass::ReplaceAccessChainLoad(
- const Instruction* address_inst, Instruction* original_load) {
- // Build and append load of variable in ptrInst
- if (address_inst->NumInOperands() == 1) {
- // An access chain with no indices is essentially a copy. All that is
- // needed is to propagate the address.
- context()->ReplaceAllUsesWith(
- address_inst->result_id(),
- address_inst->GetSingleWordInOperand(kAccessChainPtrIdInIdx));
- return true;
- }
- std::vector<std::unique_ptr<Instruction>> new_inst;
- uint32_t varId;
- uint32_t varPteTypeId;
- const uint32_t ldResultId =
- BuildAndAppendVarLoad(address_inst, &varId, &varPteTypeId, &new_inst);
- if (ldResultId == 0) {
- return false;
- }
- new_inst[0]->UpdateDebugInfoFrom(original_load);
- context()->get_decoration_mgr()->CloneDecorations(
- original_load->result_id(), ldResultId,
- {spv::Decoration::RelaxedPrecision});
- original_load->InsertBefore(std::move(new_inst));
- context()->get_debug_info_mgr()->AnalyzeDebugInst(
- original_load->PreviousNode());
- // Rewrite |original_load| into an extract.
- Instruction::OperandList new_operands;
- // copy the result id and the type id to the new operand list.
- new_operands.emplace_back(original_load->GetOperand(0));
- new_operands.emplace_back(original_load->GetOperand(1));
- new_operands.emplace_back(
- Operand({spv_operand_type_t::SPV_OPERAND_TYPE_ID, {ldResultId}}));
- AppendConstantOperands(address_inst, &new_operands);
- original_load->SetOpcode(spv::Op::OpCompositeExtract);
- original_load->ReplaceOperands(new_operands);
- context()->UpdateDefUse(original_load);
- return true;
- }
- bool LocalAccessChainConvertPass::GenAccessChainStoreReplacement(
- const Instruction* ptrInst, uint32_t valId,
- std::vector<std::unique_ptr<Instruction>>* newInsts) {
- if (ptrInst->NumInOperands() == 1) {
- // An access chain with no indices is essentially a copy. However, we still
- // have to create a new store because the old ones will be deleted.
- BuildAndAppendInst(
- spv::Op::OpStore, 0, 0,
- {{spv_operand_type_t::SPV_OPERAND_TYPE_ID,
- {ptrInst->GetSingleWordInOperand(kAccessChainPtrIdInIdx)}},
- {spv_operand_type_t::SPV_OPERAND_TYPE_ID, {valId}}},
- newInsts);
- return true;
- }
- // Build and append load of variable in ptrInst
- uint32_t varId;
- uint32_t varPteTypeId;
- const uint32_t ldResultId =
- BuildAndAppendVarLoad(ptrInst, &varId, &varPteTypeId, newInsts);
- if (ldResultId == 0) {
- return false;
- }
- context()->get_decoration_mgr()->CloneDecorations(
- varId, ldResultId, {spv::Decoration::RelaxedPrecision});
- // Build and append Insert
- const uint32_t insResultId = TakeNextId();
- if (insResultId == 0) {
- return false;
- }
- std::vector<Operand> ins_in_opnds = {
- {spv_operand_type_t::SPV_OPERAND_TYPE_ID, {valId}},
- {spv_operand_type_t::SPV_OPERAND_TYPE_ID, {ldResultId}}};
- AppendConstantOperands(ptrInst, &ins_in_opnds);
- BuildAndAppendInst(spv::Op::OpCompositeInsert, varPteTypeId, insResultId,
- ins_in_opnds, newInsts);
- context()->get_decoration_mgr()->CloneDecorations(
- varId, insResultId, {spv::Decoration::RelaxedPrecision});
- // Build and append Store
- BuildAndAppendInst(spv::Op::OpStore, 0, 0,
- {{spv_operand_type_t::SPV_OPERAND_TYPE_ID, {varId}},
- {spv_operand_type_t::SPV_OPERAND_TYPE_ID, {insResultId}}},
- newInsts);
- return true;
- }
- bool LocalAccessChainConvertPass::Is32BitConstantIndexAccessChain(
- const Instruction* acp) const {
- uint32_t inIdx = 0;
- return acp->WhileEachInId([&inIdx, this](const uint32_t* tid) {
- if (inIdx > 0) {
- Instruction* opInst = get_def_use_mgr()->GetDef(*tid);
- if (opInst->opcode() != spv::Op::OpConstant) return false;
- const auto* index =
- context()->get_constant_mgr()->GetConstantFromInst(opInst);
- int64_t index_value = index->GetSignExtendedValue();
- if (index_value > UINT32_MAX) return false;
- if (index_value < 0) return false;
- }
- ++inIdx;
- return true;
- });
- }
- bool LocalAccessChainConvertPass::HasOnlySupportedRefs(uint32_t ptrId) {
- if (supported_ref_ptrs_.find(ptrId) != supported_ref_ptrs_.end()) return true;
- if (get_def_use_mgr()->WhileEachUser(ptrId, [this](Instruction* user) {
- if (user->GetCommonDebugOpcode() == CommonDebugInfoDebugValue ||
- user->GetCommonDebugOpcode() == CommonDebugInfoDebugDeclare) {
- return true;
- }
- spv::Op op = user->opcode();
- if (IsNonPtrAccessChain(op) || op == spv::Op::OpCopyObject) {
- if (!HasOnlySupportedRefs(user->result_id())) {
- return false;
- }
- } else if (op != spv::Op::OpStore && op != spv::Op::OpLoad &&
- op != spv::Op::OpName && !IsNonTypeDecorate(op)) {
- return false;
- }
- return true;
- })) {
- supported_ref_ptrs_.insert(ptrId);
- return true;
- }
- return false;
- }
- void LocalAccessChainConvertPass::FindTargetVars(Function* func) {
- for (auto bi = func->begin(); bi != func->end(); ++bi) {
- for (auto ii = bi->begin(); ii != bi->end(); ++ii) {
- switch (ii->opcode()) {
- case spv::Op::OpStore:
- case spv::Op::OpLoad: {
- uint32_t varId;
- Instruction* ptrInst = GetPtr(&*ii, &varId);
- if (!IsTargetVar(varId)) break;
- const spv::Op op = ptrInst->opcode();
- // Rule out variables with non-supported refs eg function calls
- if (!HasOnlySupportedRefs(varId)) {
- seen_non_target_vars_.insert(varId);
- seen_target_vars_.erase(varId);
- break;
- }
- // Rule out variables with nested access chains
- // TODO(): Convert nested access chains
- bool is_non_ptr_access_chain = IsNonPtrAccessChain(op);
- if (is_non_ptr_access_chain && ptrInst->GetSingleWordInOperand(
- kAccessChainPtrIdInIdx) != varId) {
- seen_non_target_vars_.insert(varId);
- seen_target_vars_.erase(varId);
- break;
- }
- // Rule out variables accessed with non-constant indices
- if (!Is32BitConstantIndexAccessChain(ptrInst)) {
- seen_non_target_vars_.insert(varId);
- seen_target_vars_.erase(varId);
- break;
- }
- if (is_non_ptr_access_chain && AnyIndexIsOutOfBounds(ptrInst)) {
- seen_non_target_vars_.insert(varId);
- seen_target_vars_.erase(varId);
- break;
- }
- } break;
- default:
- break;
- }
- }
- }
- }
- Pass::Status LocalAccessChainConvertPass::ConvertLocalAccessChains(
- Function* func) {
- FindTargetVars(func);
- // Replace access chains of all targeted variables with equivalent
- // extract and insert sequences
- bool modified = false;
- for (auto bi = func->begin(); bi != func->end(); ++bi) {
- std::vector<Instruction*> dead_instructions;
- for (auto ii = bi->begin(); ii != bi->end(); ++ii) {
- switch (ii->opcode()) {
- case spv::Op::OpLoad: {
- uint32_t varId;
- Instruction* ptrInst = GetPtr(&*ii, &varId);
- if (!IsNonPtrAccessChain(ptrInst->opcode())) break;
- if (!IsTargetVar(varId)) break;
- if (!ReplaceAccessChainLoad(ptrInst, &*ii)) {
- return Status::Failure;
- }
- modified = true;
- } break;
- case spv::Op::OpStore: {
- uint32_t varId;
- Instruction* store = &*ii;
- Instruction* ptrInst = GetPtr(store, &varId);
- if (!IsNonPtrAccessChain(ptrInst->opcode())) break;
- if (!IsTargetVar(varId)) break;
- std::vector<std::unique_ptr<Instruction>> newInsts;
- uint32_t valId = store->GetSingleWordInOperand(kStoreValIdInIdx);
- if (!GenAccessChainStoreReplacement(ptrInst, valId, &newInsts)) {
- return Status::Failure;
- }
- size_t num_of_instructions_to_skip = newInsts.size() - 1;
- dead_instructions.push_back(store);
- ++ii;
- ii = ii.InsertBefore(std::move(newInsts));
- for (size_t i = 0; i < num_of_instructions_to_skip; ++i) {
- ii->UpdateDebugInfoFrom(store);
- context()->get_debug_info_mgr()->AnalyzeDebugInst(&*ii);
- ++ii;
- }
- ii->UpdateDebugInfoFrom(store);
- context()->get_debug_info_mgr()->AnalyzeDebugInst(&*ii);
- modified = true;
- } break;
- default:
- break;
- }
- }
- while (!dead_instructions.empty()) {
- Instruction* inst = dead_instructions.back();
- dead_instructions.pop_back();
- DCEInst(inst, [&dead_instructions](Instruction* other_inst) {
- auto i = std::find(dead_instructions.begin(), dead_instructions.end(),
- other_inst);
- if (i != dead_instructions.end()) {
- dead_instructions.erase(i);
- }
- });
- }
- }
- return (modified ? Status::SuccessWithChange : Status::SuccessWithoutChange);
- }
- void LocalAccessChainConvertPass::Initialize() {
- // Initialize Target Variable Caches
- seen_target_vars_.clear();
- seen_non_target_vars_.clear();
- // Initialize collections
- supported_ref_ptrs_.clear();
- // Initialize extension allowlist
- InitExtensions();
- }
- bool LocalAccessChainConvertPass::AllExtensionsSupported() const {
- // This capability can now exist without the extension, so we have to check
- // for the capability. This pass is only looking at function scope symbols,
- // so we do not care if there are variable pointers on storage buffers.
- if (context()->get_feature_mgr()->HasCapability(
- spv::Capability::VariablePointers))
- return false;
- // If any extension not in allowlist, return false
- for (auto& ei : get_module()->extensions()) {
- const std::string extName = ei.GetInOperand(0).AsString();
- if (extensions_allowlist_.find(extName) == extensions_allowlist_.end())
- return false;
- }
- // only allow NonSemantic.Shader.DebugInfo.100, we cannot safely optimise
- // around unknown extended
- // instruction sets even if they are non-semantic
- for (auto& inst : context()->module()->ext_inst_imports()) {
- assert(inst.opcode() == spv::Op::OpExtInstImport &&
- "Expecting an import of an extension's instruction set.");
- const std::string extension_name = inst.GetInOperand(0).AsString();
- if (spvtools::utils::starts_with(extension_name, "NonSemantic.") &&
- extension_name != "NonSemantic.Shader.DebugInfo.100") {
- return false;
- }
- }
- return true;
- }
- Pass::Status LocalAccessChainConvertPass::ProcessImpl() {
- // Do not process if module contains OpGroupDecorate. Additional
- // support required in KillNamesAndDecorates().
- // TODO(greg-lunarg): Add support for OpGroupDecorate
- for (auto& ai : get_module()->annotations())
- if (ai.opcode() == spv::Op::OpGroupDecorate)
- return Status::SuccessWithoutChange;
- // Do not process if any disallowed extensions are enabled
- if (!AllExtensionsSupported()) return Status::SuccessWithoutChange;
- // Process all functions in the module.
- Status status = Status::SuccessWithoutChange;
- for (Function& func : *get_module()) {
- status = CombineStatus(status, ConvertLocalAccessChains(&func));
- if (status == Status::Failure) {
- break;
- }
- }
- return status;
- }
- LocalAccessChainConvertPass::LocalAccessChainConvertPass() {}
- Pass::Status LocalAccessChainConvertPass::Process() {
- Initialize();
- return ProcessImpl();
- }
- void LocalAccessChainConvertPass::InitExtensions() {
- extensions_allowlist_.clear();
- extensions_allowlist_.insert(
- {"SPV_AMD_shader_explicit_vertex_parameter",
- "SPV_AMD_shader_trinary_minmax", "SPV_AMD_gcn_shader",
- "SPV_KHR_shader_ballot", "SPV_AMD_shader_ballot",
- "SPV_AMD_gpu_shader_half_float", "SPV_KHR_shader_draw_parameters",
- "SPV_KHR_subgroup_vote", "SPV_KHR_8bit_storage", "SPV_KHR_16bit_storage",
- "SPV_KHR_device_group", "SPV_KHR_multiview",
- "SPV_NVX_multiview_per_view_attributes", "SPV_NV_viewport_array2",
- "SPV_NV_stereo_view_rendering", "SPV_NV_sample_mask_override_coverage",
- "SPV_NV_geometry_shader_passthrough", "SPV_AMD_texture_gather_bias_lod",
- "SPV_KHR_storage_buffer_storage_class",
- // SPV_KHR_variable_pointers
- // Currently do not support extended pointer expressions
- "SPV_AMD_gpu_shader_int16", "SPV_KHR_post_depth_coverage",
- "SPV_KHR_shader_atomic_counter_ops", "SPV_EXT_shader_stencil_export",
- "SPV_EXT_shader_viewport_index_layer",
- "SPV_AMD_shader_image_load_store_lod", "SPV_AMD_shader_fragment_mask",
- "SPV_EXT_fragment_fully_covered", "SPV_AMD_gpu_shader_half_float_fetch",
- "SPV_GOOGLE_decorate_string", "SPV_GOOGLE_hlsl_functionality1",
- "SPV_GOOGLE_user_type", "SPV_NV_shader_subgroup_partitioned",
- "SPV_EXT_demote_to_helper_invocation", "SPV_EXT_descriptor_indexing",
- "SPV_NV_fragment_shader_barycentric",
- "SPV_NV_compute_shader_derivatives", "SPV_NV_shader_image_footprint",
- "SPV_NV_shading_rate", "SPV_NV_mesh_shader", "SPV_EXT_mesh_shader",
- "SPV_NV_ray_tracing", "SPV_KHR_ray_tracing", "SPV_KHR_ray_query",
- "SPV_EXT_fragment_invocation_density", "SPV_KHR_terminate_invocation",
- "SPV_KHR_subgroup_uniform_control_flow", "SPV_KHR_integer_dot_product",
- "SPV_EXT_shader_image_int64", "SPV_KHR_non_semantic_info",
- "SPV_KHR_uniform_group_instructions",
- "SPV_KHR_fragment_shader_barycentric", "SPV_KHR_vulkan_memory_model",
- "SPV_NV_bindless_texture", "SPV_EXT_shader_atomic_float_add",
- "SPV_EXT_fragment_shader_interlock",
- "SPV_KHR_compute_shader_derivatives", "SPV_NV_cooperative_matrix",
- "SPV_KHR_cooperative_matrix", "SPV_KHR_ray_tracing_position_fetch",
- "SPV_AMDX_shader_enqueue", "SPV_KHR_fragment_shading_rate"});
- }
- bool LocalAccessChainConvertPass::AnyIndexIsOutOfBounds(
- const Instruction* access_chain_inst) {
- assert(IsNonPtrAccessChain(access_chain_inst->opcode()));
- analysis::TypeManager* type_mgr = context()->get_type_mgr();
- analysis::ConstantManager* const_mgr = context()->get_constant_mgr();
- auto constants = const_mgr->GetOperandConstants(access_chain_inst);
- uint32_t base_pointer_id = access_chain_inst->GetSingleWordInOperand(0);
- Instruction* base_pointer = get_def_use_mgr()->GetDef(base_pointer_id);
- const analysis::Pointer* base_pointer_type =
- type_mgr->GetType(base_pointer->type_id())->AsPointer();
- assert(base_pointer_type != nullptr &&
- "The base of the access chain is not a pointer.");
- const analysis::Type* current_type = base_pointer_type->pointee_type();
- for (uint32_t i = 1; i < access_chain_inst->NumInOperands(); ++i) {
- if (IsIndexOutOfBounds(constants[i], current_type)) {
- return true;
- }
- uint32_t index =
- (constants[i]
- ? static_cast<uint32_t>(constants[i]->GetZeroExtendedValue())
- : 0);
- current_type = type_mgr->GetMemberType(current_type, {index});
- }
- return false;
- }
- bool LocalAccessChainConvertPass::IsIndexOutOfBounds(
- const analysis::Constant* index, const analysis::Type* type) const {
- if (index == nullptr) {
- return false;
- }
- return index->GetZeroExtendedValue() >= type->NumberOfComponents();
- }
- } // namespace opt
- } // namespace spvtools
|