// Copyright (c) 2017 The Khronos Group Inc. // Copyright (c) 2017 Valve Corporation // Copyright (c) 2017 LunarG Inc. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #include "block_merge_pass.h" #include "ir_context.h" #include "iterator.h" namespace spvtools { namespace opt { bool BlockMergePass::HasMultipleRefs(uint32_t labId) { bool multiple_refs = false; return !get_def_use_mgr()->WhileEachUser( labId, [&multiple_refs](ir::Instruction* user) { if (user->opcode() != SpvOpName) { if (multiple_refs) return false; multiple_refs = true; } return true; }); } void BlockMergePass::KillInstAndName(ir::Instruction* inst) { std::vector to_kill; get_def_use_mgr()->ForEachUser(inst, [&to_kill](ir::Instruction* user) { if (user->opcode() == SpvOpName) { to_kill.push_back(user); } }); for (auto i : to_kill) { context()->KillInst(i); } context()->KillInst(inst); } bool BlockMergePass::MergeBlocks(ir::Function* func) { bool modified = false; for (auto bi = func->begin(); bi != func->end();) { // Do not merge loop header blocks, at least for now. if (bi->IsLoopHeader()) { ++bi; continue; } // Find block with single successor which has no other predecessors. // Continue and Merge blocks are currently ruled out as second blocks. // Happily any such candidate blocks will have >1 uses due to their // LoopMerge instruction. // TODO(): Deal with phi instructions that reference the // second block. Happily, these references currently inhibit // the merge. auto ii = bi->end(); --ii; ir::Instruction* br = &*ii; if (br->opcode() != SpvOpBranch) { ++bi; continue; } const uint32_t labId = br->GetSingleWordInOperand(0); if (HasMultipleRefs(labId)) { ++bi; continue; } // Merge blocks context()->KillInst(br); auto sbi = bi; for (; sbi != func->end(); ++sbi) if (sbi->id() == labId) break; // If bi is sbi's only predecessor, it dominates sbi and thus // sbi must follow bi in func's ordering. assert(sbi != func->end()); bi->AddInstructions(&*sbi); KillInstAndName(sbi->GetLabelInst()); (void)sbi.Erase(); // reprocess block modified = true; } return modified; } void BlockMergePass::Initialize(ir::IRContext* c) { InitializeProcessing(c); // Initialize extension whitelist InitExtensions(); }; bool BlockMergePass::AllExtensionsSupported() const { // If any extension not in whitelist, return false for (auto& ei : get_module()->extensions()) { const char* extName = reinterpret_cast(&ei.GetInOperand(0).words[0]); if (extensions_whitelist_.find(extName) == extensions_whitelist_.end()) return false; } return true; } Pass::Status BlockMergePass::ProcessImpl() { // Do not process if any disallowed extensions are enabled if (!AllExtensionsSupported()) return Status::SuccessWithoutChange; // Process all entry point functions. ProcessFunction pfn = [this](ir::Function* fp) { return MergeBlocks(fp); }; bool modified = ProcessEntryPointCallTree(pfn, get_module()); return modified ? Status::SuccessWithChange : Status::SuccessWithoutChange; } BlockMergePass::BlockMergePass() {} Pass::Status BlockMergePass::Process(ir::IRContext* c) { Initialize(c); return ProcessImpl(); } void BlockMergePass::InitExtensions() { extensions_whitelist_.clear(); extensions_whitelist_.insert({ "SPV_AMD_shader_explicit_vertex_parameter", "SPV_AMD_shader_trinary_minmax", "SPV_AMD_gcn_shader", "SPV_KHR_shader_ballot", "SPV_AMD_shader_ballot", "SPV_AMD_gpu_shader_half_float", "SPV_KHR_shader_draw_parameters", "SPV_KHR_subgroup_vote", "SPV_KHR_16bit_storage", "SPV_KHR_device_group", "SPV_KHR_multiview", "SPV_NVX_multiview_per_view_attributes", "SPV_NV_viewport_array2", "SPV_NV_stereo_view_rendering", "SPV_NV_sample_mask_override_coverage", "SPV_NV_geometry_shader_passthrough", "SPV_AMD_texture_gather_bias_lod", "SPV_KHR_storage_buffer_storage_class", "SPV_KHR_variable_pointers", "SPV_AMD_gpu_shader_int16", "SPV_KHR_post_depth_coverage", "SPV_KHR_shader_atomic_counter_ops", }); } } // namespace opt } // namespace spvtools