// Copyright (c) 2018 The Khronos Group Inc. // Copyright (c) 2018 Valve Corporation // Copyright (c) 2018 LunarG Inc. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #ifndef LIBSPIRV_OPT_INSTRUMENT_PASS_H_ #define LIBSPIRV_OPT_INSTRUMENT_PASS_H_ #include #include #include #include "source/opt/ir_builder.h" #include "source/opt/pass.h" #include "spirv-tools/instrument.hpp" // This is a base class to assist in the creation of passes which instrument // shader modules. More specifically, passes which replace instructions with a // larger and more capable set of instructions. Commonly, these new // instructions will add testing of operands and execute different // instructions depending on the outcome, including outputting of debug // information into a buffer created especially for that purpose. // // This class contains helper functions to create an InstProcessFunction, // which is the heart of any derived class implementing a specific // instrumentation pass. It takes an instruction as an argument, decides // if it should be instrumented, and generates code to replace it. This class // also supplies function InstProcessEntryPointCallTree which applies the // InstProcessFunction to every reachable instruction in a module and replaces // the instruction with new instructions if generated. // // Chief among the helper functions are output code generation functions, // used to generate code in the shader which writes data to output buffers // associated with that validation. Currently one such function, // GenDebugStreamWrite, exists. Other such functions may be added in the // future. Each is accompanied by documentation describing the format of // its output buffer. // // A validation pass may read or write multiple buffers. All such buffers // are located in a single debug descriptor set whose index is passed at the // creation of the instrumentation pass. The bindings of the buffers used by // a validation pass are permanently assigned and fixed and documented by // the kDebugOutput* static consts. namespace spvtools { namespace opt { // Validation Ids // These are used to identify the general validation being done and map to // its output buffers. static const uint32_t kInstValidationIdBindless = 0; static const uint32_t kInstValidationIdBuffAddr = 1; static const uint32_t kInstValidationIdDebugPrintf = 2; class InstrumentPass : public Pass { using cbb_ptr = const BasicBlock*; public: using InstProcessFunction = std::function, uint32_t, std::vector>*)>; ~InstrumentPass() override = default; IRContext::Analysis GetPreservedAnalyses() override { return IRContext::kAnalysisDefUse | IRContext::kAnalysisDecorations | IRContext::kAnalysisCombinators | IRContext::kAnalysisNameMap | IRContext::kAnalysisBuiltinVarId | IRContext::kAnalysisConstants; } protected: // Create instrumentation pass for |validation_id| which utilizes descriptor // set |desc_set| for debug input and output buffers and writes |shader_id| // into debug output records. |opt_direct_reads| indicates that the pass // will see direct input buffer reads and should prepare to optimize them. InstrumentPass(uint32_t desc_set, uint32_t shader_id, uint32_t validation_id, bool opt_direct_reads = false) : Pass(), desc_set_(desc_set), shader_id_(shader_id), validation_id_(validation_id), opt_direct_reads_(opt_direct_reads) {} // Initialize state for instrumentation of module. void InitializeInstrument(); // Call |pfn| on all instructions in all functions in the call tree of the // entry points in |module|. If code is generated for an instruction, replace // the instruction's block with the new blocks that are generated. Continue // processing at the top of the last new block. bool InstProcessEntryPointCallTree(InstProcessFunction& pfn); // Move all code in |ref_block_itr| preceding the instruction |ref_inst_itr| // to be instrumented into block |new_blk_ptr|. void MovePreludeCode(BasicBlock::iterator ref_inst_itr, UptrVectorIterator ref_block_itr, std::unique_ptr* new_blk_ptr); // Move all code in |ref_block_itr| succeeding the instruction |ref_inst_itr| // to be instrumented into block |new_blk_ptr|. void MovePostludeCode(UptrVectorIterator ref_block_itr, BasicBlock* new_blk_ptr); // Generate instructions in |builder| which will atomically fetch and // increment the size of the debug output buffer stream of the current // validation and write a record to the end of the stream, if enough space // in the buffer remains. The record will contain the index of the function // and instruction within that function |func_idx, instruction_idx| which // generated the record. It will also contain additional information to // identify the instance of the shader, depending on the stage |stage_idx| // of the shader. Finally, the record will contain validation-specific // data contained in |validation_ids| which will identify the validation // error as well as the values involved in the error. // // The output buffer binding written to by the code generated by the function // is determined by the validation id specified when each specific // instrumentation pass is created. // // The output buffer is a sequence of 32-bit values with the following // format (where all elements are unsigned 32-bit unless otherwise noted): // // Size // Record0 // Record1 // Record2 // ... // // Size is the number of 32-bit values that have been written or // attempted to be written to the output buffer, excluding the Size. It is // initialized to 0. If the size of attempts to write the buffer exceeds // the actual size of the buffer, it is possible that this field can exceed // the actual size of the buffer. // // Each Record* is a variable-length sequence of 32-bit values with the // following format defined using static const offsets in the .cpp file: // // Record Size // Shader ID // Instruction Index // Stage // Stage-specific Word 0 // Stage-specific Word 1 // ... // Validation Error Code // Validation-specific Word 0 // Validation-specific Word 1 // Validation-specific Word 2 // ... // // Each record consists of three subsections: members common across all // validation, members specific to the stage, and members specific to a // validation. // // The Record Size is the number of 32-bit words in the record, including // the Record Size word. // // Shader ID is a value that identifies which shader has generated the // validation error. It is passed when the instrumentation pass is created. // // The Instruction Index is the position of the instruction within the // SPIR-V file which is in error. // // The Stage is the pipeline stage which has generated the error as defined // by the SpvExecutionModel_ enumeration. This is used to interpret the // following Stage-specific words. // // The Stage-specific Words identify which invocation of the shader generated // the error. Every stage will write a fixed number of words. Vertex shaders // will write the Vertex and Instance ID. Fragment shaders will write // FragCoord.xy. Compute shaders will write the GlobalInvocation ID. // The tessellation eval shader will write the Primitive ID and TessCoords.uv. // The tessellation control shader and geometry shader will write the // Primitive ID and Invocation ID. // // The Validation Error Code specifies the exact error which has occurred. // These are enumerated with the kInstError* static consts. This allows // multiple validation layers to use the same, single output buffer. // // The Validation-specific Words are a validation-specific number of 32-bit // words which give further information on the validation error that // occurred. These are documented further in each file containing the // validation-specific class which derives from this base class. // // Because the code that is generated checks against the size of the buffer // before writing, the size of the debug out buffer can be used by the // validation layer to control the number of error records that are written. void GenDebugStreamWrite(uint32_t instruction_idx, uint32_t stage_idx, const std::vector& validation_ids, InstructionBuilder* builder); // Return true if all instructions in |ids| are constants or spec constants. bool AllConstant(const std::vector& ids); // Generate in |builder| instructions to read the unsigned integer from the // input buffer specified by the offsets in |offset_ids|. Given offsets // o0, o1, ... oN, and input buffer ibuf, return the id for the value: // // ibuf[...ibuf[ibuf[o0]+o1]...+oN] // // The binding and the format of the input buffer is determined by each // specific validation, which is specified at the creation of the pass. uint32_t GenDebugDirectRead(const std::vector& offset_ids, InstructionBuilder* builder); // Generate code to convert integer |value_id| to 32bit, if needed. Return // an id to the 32bit equivalent. uint32_t Gen32BitCvtCode(uint32_t value_id, InstructionBuilder* builder); // Generate code to cast integer |value_id| to 32bit unsigned, if needed. // Return an id to the Uint equivalent. uint32_t GenUintCastCode(uint32_t value_id, InstructionBuilder* builder); // Return new label. std::unique_ptr NewLabel(uint32_t label_id); // Return id for 32-bit unsigned type uint32_t GetUintId(); // Return id for 64-bit unsigned type uint32_t GetUint64Id(); // Return id for 8-bit unsigned type uint32_t GetUint8Id(); // Return id for 32-bit unsigned type uint32_t GetBoolId(); // Return id for void type uint32_t GetVoidId(); // Return pointer to type for runtime array of uint analysis::Type* GetUintXRuntimeArrayType(uint32_t width, analysis::Type** rarr_ty); // Return pointer to type for runtime array of uint analysis::Type* GetUintRuntimeArrayType(uint32_t width); // Return id for buffer uint type uint32_t GetOutputBufferPtrId(); // Return id for buffer uint type uint32_t GetInputBufferTypeId(); // Return id for buffer uint type uint32_t GetInputBufferPtrId(); // Return binding for output buffer for current validation. uint32_t GetOutputBufferBinding(); // Return binding for input buffer for current validation. uint32_t GetInputBufferBinding(); // Add storage buffer extension if needed void AddStorageBufferExt(); // Return id for debug output buffer uint32_t GetOutputBufferId(); // Return id for debug input buffer uint32_t GetInputBufferId(); // Return id for 32-bit float type uint32_t GetFloatId(); // Return id for v4float type uint32_t GetVec4FloatId(); // Return id for uint vector type of |length| uint32_t GetVecUintId(uint32_t length); // Return id for v4uint type uint32_t GetVec4UintId(); // Return id for v3uint type uint32_t GetVec3UintId(); // Return id for output function. Define if it doesn't exist with // |val_spec_param_cnt| validation-specific uint32 parameters. uint32_t GetStreamWriteFunctionId(uint32_t stage_idx, uint32_t val_spec_param_cnt); // Return id for input function taking |param_cnt| uint32 parameters. Define // if it doesn't exist. uint32_t GetDirectReadFunctionId(uint32_t param_cnt); // Split block |block_itr| into two new blocks where the second block // contains |inst_itr| and place in |new_blocks|. void SplitBlock(BasicBlock::iterator inst_itr, UptrVectorIterator block_itr, std::vector>* new_blocks); // Apply instrumentation function |pfn| to every instruction in |func|. // If code is generated for an instruction, replace the instruction's // block with the new blocks that are generated. Continue processing at the // top of the last new block. bool InstrumentFunction(Function* func, uint32_t stage_idx, InstProcessFunction& pfn); // Call |pfn| on all functions in the call tree of the function // ids in |roots|. bool InstProcessCallTreeFromRoots(InstProcessFunction& pfn, std::queue* roots, uint32_t stage_idx); // Gen code into |builder| to write |field_value_id| into debug output // buffer at |base_offset_id| + |field_offset|. void GenDebugOutputFieldCode(uint32_t base_offset_id, uint32_t field_offset, uint32_t field_value_id, InstructionBuilder* builder); // Generate instructions into |builder| which will write the members // of the debug output record common for all stages and validations at // |base_off|. void GenCommonStreamWriteCode(uint32_t record_sz, uint32_t instruction_idx, uint32_t stage_idx, uint32_t base_off, InstructionBuilder* builder); // Generate instructions into |builder| which will write // |uint_frag_coord_id| at |component| of the record at |base_offset_id| of // the debug output buffer . void GenFragCoordEltDebugOutputCode(uint32_t base_offset_id, uint32_t uint_frag_coord_id, uint32_t component, InstructionBuilder* builder); // Generate instructions into |builder| which will load |var_id| and return // its result id. uint32_t GenVarLoad(uint32_t var_id, InstructionBuilder* builder); // Generate instructions into |builder| which will load the uint |builtin_id| // and write it into the debug output buffer at |base_off| + |builtin_off|. void GenBuiltinOutputCode(uint32_t builtin_id, uint32_t builtin_off, uint32_t base_off, InstructionBuilder* builder); // Generate instructions into |builder| which will write the |stage_idx|- // specific members of the debug output stream at |base_off|. void GenStageStreamWriteCode(uint32_t stage_idx, uint32_t base_off, InstructionBuilder* builder); // Return true if instruction must be in the same block that its result // is used. bool IsSameBlockOp(const Instruction* inst) const; // Clone operands which must be in same block as consumer instructions. // Look in same_blk_pre for instructions that need cloning. Look in // same_blk_post for instructions already cloned. Add cloned instruction // to same_blk_post. void CloneSameBlockOps( std::unique_ptr* inst, std::unordered_map* same_blk_post, std::unordered_map* same_blk_pre, BasicBlock* block_ptr); // Update phis in succeeding blocks to point to new last block void UpdateSucceedingPhis( std::vector>& new_blocks); // Debug descriptor set index uint32_t desc_set_; // Shader module ID written into output record uint32_t shader_id_; // Map from function id to function pointer. std::unordered_map id2function_; // Map from block's label id to block. TODO(dnovillo): This is superfluous wrt // CFG. It has functionality not present in CFG. Consolidate. std::unordered_map id2block_; // Map from instruction's unique id to offset in original file. std::unordered_map uid2offset_; // result id for OpConstantFalse uint32_t validation_id_; // id for output buffer variable uint32_t output_buffer_id_; // ptr type id for output buffer element uint32_t output_buffer_ptr_id_; // ptr type id for input buffer element uint32_t input_buffer_ptr_id_; // id for debug output function std::unordered_map param2output_func_id_; // ids for debug input functions std::unordered_map param2input_func_id_; // id for input buffer variable uint32_t input_buffer_id_; // id for 32-bit float type uint32_t float_id_; // id for v4float type uint32_t v4float_id_; // id for v4uint type uint32_t v4uint_id_; // id for v3uint type uint32_t v3uint_id_; // id for 32-bit unsigned type uint32_t uint_id_; // id for 64-bit unsigned type uint32_t uint64_id_; // id for 8-bit unsigned type uint32_t uint8_id_; // id for bool type uint32_t bool_id_; // id for void type uint32_t void_id_; // boolean to remember storage buffer extension bool storage_buffer_ext_defined_; // runtime array of uint type analysis::Type* uint64_rarr_ty_; // runtime array of uint type analysis::Type* uint32_rarr_ty_; // Pre-instrumentation same-block insts std::unordered_map same_block_pre_; // Post-instrumentation same-block op ids std::unordered_map same_block_post_; // Map function calls to result id. Clear for every function. // This is for debug input reads with constant arguments that // have been generated into the first block of the function. // This mechanism is used to avoid multiple identical debug // input buffer reads. struct vector_hash_ { std::size_t operator()(const std::vector& v) const { std::size_t hash = v.size(); for (auto& u : v) { hash ^= u + 0x9e3779b9 + (hash << 11) + (hash >> 21); } return hash; } }; std::unordered_map, uint32_t, vector_hash_> call2id_; // Function currently being instrumented Function* curr_func_; // Optimize direct debug input buffer reads. Specifically, move all such // reads with constant args to first block and reuse them. bool opt_direct_reads_; }; } // namespace opt } // namespace spvtools #endif // LIBSPIRV_OPT_INSTRUMENT_PASS_H_