476 lines
18 KiB
C++
476 lines
18 KiB
C++
// Copyright (c) 2018 The Khronos Group Inc.
|
|
// Copyright (c) 2018 Valve Corporation
|
|
// Copyright (c) 2018 LunarG Inc.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
#ifndef LIBSPIRV_OPT_INSTRUMENT_PASS_H_
|
|
#define LIBSPIRV_OPT_INSTRUMENT_PASS_H_
|
|
|
|
#include <list>
|
|
#include <memory>
|
|
#include <vector>
|
|
|
|
#include "source/opt/ir_builder.h"
|
|
#include "source/opt/pass.h"
|
|
#include "spirv-tools/instrument.hpp"
|
|
|
|
// This is a base class to assist in the creation of passes which instrument
|
|
// shader modules. More specifically, passes which replace instructions with a
|
|
// larger and more capable set of instructions. Commonly, these new
|
|
// instructions will add testing of operands and execute different
|
|
// instructions depending on the outcome, including outputting of debug
|
|
// information into a buffer created especially for that purpose.
|
|
//
|
|
// This class contains helper functions to create an InstProcessFunction,
|
|
// which is the heart of any derived class implementing a specific
|
|
// instrumentation pass. It takes an instruction as an argument, decides
|
|
// if it should be instrumented, and generates code to replace it. This class
|
|
// also supplies function InstProcessEntryPointCallTree which applies the
|
|
// InstProcessFunction to every reachable instruction in a module and replaces
|
|
// the instruction with new instructions if generated.
|
|
//
|
|
// Chief among the helper functions are output code generation functions,
|
|
// used to generate code in the shader which writes data to output buffers
|
|
// associated with that validation. Currently one such function,
|
|
// GenDebugStreamWrite, exists. Other such functions may be added in the
|
|
// future. Each is accompanied by documentation describing the format of
|
|
// its output buffer.
|
|
//
|
|
// A validation pass may read or write multiple buffers. All such buffers
|
|
// are located in a single debug descriptor set whose index is passed at the
|
|
// creation of the instrumentation pass. The bindings of the buffers used by
|
|
// a validation pass are permanantly assigned and fixed and documented by
|
|
// the kDebugOutput* static consts.
|
|
|
|
namespace spvtools {
|
|
namespace opt {
|
|
|
|
// Validation Ids
|
|
// These are used to identify the general validation being done and map to
|
|
// its output buffers.
|
|
static const uint32_t kInstValidationIdBindless = 0;
|
|
static const uint32_t kInstValidationIdBuffAddr = 1;
|
|
static const uint32_t kInstValidationIdDebugPrintf = 2;
|
|
|
|
class InstrumentPass : public Pass {
|
|
using cbb_ptr = const BasicBlock*;
|
|
|
|
public:
|
|
using InstProcessFunction =
|
|
std::function<void(BasicBlock::iterator, UptrVectorIterator<BasicBlock>,
|
|
uint32_t, std::vector<std::unique_ptr<BasicBlock>>*)>;
|
|
|
|
~InstrumentPass() override = default;
|
|
|
|
IRContext::Analysis GetPreservedAnalyses() override {
|
|
return IRContext::kAnalysisDefUse | IRContext::kAnalysisDecorations |
|
|
IRContext::kAnalysisCombinators | IRContext::kAnalysisNameMap |
|
|
IRContext::kAnalysisBuiltinVarId | IRContext::kAnalysisConstants;
|
|
}
|
|
|
|
protected:
|
|
// Create instrumentation pass for |validation_id| which utilizes descriptor
|
|
// set |desc_set| for debug input and output buffers and writes |shader_id|
|
|
// into debug output records. |opt_direct_reads| indicates that the pass
|
|
// will see direct input buffer reads and should prepare to optimize them.
|
|
InstrumentPass(uint32_t desc_set, uint32_t shader_id, uint32_t validation_id,
|
|
bool opt_direct_reads = false)
|
|
: Pass(),
|
|
desc_set_(desc_set),
|
|
shader_id_(shader_id),
|
|
validation_id_(validation_id),
|
|
opt_direct_reads_(opt_direct_reads) {}
|
|
|
|
// Initialize state for instrumentation of module.
|
|
void InitializeInstrument();
|
|
|
|
// Call |pfn| on all instructions in all functions in the call tree of the
|
|
// entry points in |module|. If code is generated for an instruction, replace
|
|
// the instruction's block with the new blocks that are generated. Continue
|
|
// processing at the top of the last new block.
|
|
bool InstProcessEntryPointCallTree(InstProcessFunction& pfn);
|
|
|
|
// Move all code in |ref_block_itr| preceding the instruction |ref_inst_itr|
|
|
// to be instrumented into block |new_blk_ptr|.
|
|
void MovePreludeCode(BasicBlock::iterator ref_inst_itr,
|
|
UptrVectorIterator<BasicBlock> ref_block_itr,
|
|
std::unique_ptr<BasicBlock>* new_blk_ptr);
|
|
|
|
// Move all code in |ref_block_itr| succeeding the instruction |ref_inst_itr|
|
|
// to be instrumented into block |new_blk_ptr|.
|
|
void MovePostludeCode(UptrVectorIterator<BasicBlock> ref_block_itr,
|
|
BasicBlock* new_blk_ptr);
|
|
|
|
// Generate instructions in |builder| which will atomically fetch and
|
|
// increment the size of the debug output buffer stream of the current
|
|
// validation and write a record to the end of the stream, if enough space
|
|
// in the buffer remains. The record will contain the index of the function
|
|
// and instruction within that function |func_idx, instruction_idx| which
|
|
// generated the record. It will also contain additional information to
|
|
// identify the instance of the shader, depending on the stage |stage_idx|
|
|
// of the shader. Finally, the record will contain validation-specific
|
|
// data contained in |validation_ids| which will identify the validation
|
|
// error as well as the values involved in the error.
|
|
//
|
|
// The output buffer binding written to by the code generated by the function
|
|
// is determined by the validation id specified when each specific
|
|
// instrumentation pass is created.
|
|
//
|
|
// The output buffer is a sequence of 32-bit values with the following
|
|
// format (where all elements are unsigned 32-bit unless otherwise noted):
|
|
//
|
|
// Size
|
|
// Record0
|
|
// Record1
|
|
// Record2
|
|
// ...
|
|
//
|
|
// Size is the number of 32-bit values that have been written or
|
|
// attempted to be written to the output buffer, excluding the Size. It is
|
|
// initialized to 0. If the size of attempts to write the buffer exceeds
|
|
// the actual size of the buffer, it is possible that this field can exceed
|
|
// the actual size of the buffer.
|
|
//
|
|
// Each Record* is a variable-length sequence of 32-bit values with the
|
|
// following format defined using static const offsets in the .cpp file:
|
|
//
|
|
// Record Size
|
|
// Shader ID
|
|
// Instruction Index
|
|
// Stage
|
|
// Stage-specific Word 0
|
|
// Stage-specific Word 1
|
|
// ...
|
|
// Validation Error Code
|
|
// Validation-specific Word 0
|
|
// Validation-specific Word 1
|
|
// Validation-specific Word 2
|
|
// ...
|
|
//
|
|
// Each record consists of three subsections: members common across all
|
|
// validation, members specific to the stage, and members specific to a
|
|
// validation.
|
|
//
|
|
// The Record Size is the number of 32-bit words in the record, including
|
|
// the Record Size word.
|
|
//
|
|
// Shader ID is a value that identifies which shader has generated the
|
|
// validation error. It is passed when the instrumentation pass is created.
|
|
//
|
|
// The Instruction Index is the position of the instruction within the
|
|
// SPIR-V file which is in error.
|
|
//
|
|
// The Stage is the pipeline stage which has generated the error as defined
|
|
// by the SpvExecutionModel_ enumeration. This is used to interpret the
|
|
// following Stage-specific words.
|
|
//
|
|
// The Stage-specific Words identify which invocation of the shader generated
|
|
// the error. Every stage will write a fixed number of words. Vertex shaders
|
|
// will write the Vertex and Instance ID. Fragment shaders will write
|
|
// FragCoord.xy. Compute shaders will write the GlobalInvocation ID.
|
|
// The tesselation eval shader will write the Primitive ID and TessCoords.uv.
|
|
// The tesselation control shader and geometry shader will write the
|
|
// Primitive ID and Invocation ID.
|
|
//
|
|
// The Validation Error Code specifies the exact error which has occurred.
|
|
// These are enumerated with the kInstError* static consts. This allows
|
|
// multiple validation layers to use the same, single output buffer.
|
|
//
|
|
// The Validation-specific Words are a validation-specific number of 32-bit
|
|
// words which give further information on the validation error that
|
|
// occurred. These are documented further in each file containing the
|
|
// validation-specific class which derives from this base class.
|
|
//
|
|
// Because the code that is generated checks against the size of the buffer
|
|
// before writing, the size of the debug out buffer can be used by the
|
|
// validation layer to control the number of error records that are written.
|
|
void GenDebugStreamWrite(uint32_t instruction_idx, uint32_t stage_idx,
|
|
const std::vector<uint32_t>& validation_ids,
|
|
InstructionBuilder* builder);
|
|
|
|
// Return true if all instructions in |ids| are constants or spec constants.
|
|
bool AllConstant(const std::vector<uint32_t>& ids);
|
|
|
|
// Generate in |builder| instructions to read the unsigned integer from the
|
|
// input buffer specified by the offsets in |offset_ids|. Given offsets
|
|
// o0, o1, ... oN, and input buffer ibuf, return the id for the value:
|
|
//
|
|
// ibuf[...ibuf[ibuf[o0]+o1]...+oN]
|
|
//
|
|
// The binding and the format of the input buffer is determined by each
|
|
// specific validation, which is specified at the creation of the pass.
|
|
uint32_t GenDebugDirectRead(const std::vector<uint32_t>& offset_ids,
|
|
InstructionBuilder* builder);
|
|
|
|
// Generate code to convert integer |value_id| to 32bit, if needed. Return
|
|
// an id to the 32bit equivalent.
|
|
uint32_t Gen32BitCvtCode(uint32_t value_id, InstructionBuilder* builder);
|
|
|
|
// Generate code to cast integer |value_id| to 32bit unsigned, if needed.
|
|
// Return an id to the Uint equivalent.
|
|
uint32_t GenUintCastCode(uint32_t value_id, InstructionBuilder* builder);
|
|
|
|
// Return new label.
|
|
std::unique_ptr<Instruction> NewLabel(uint32_t label_id);
|
|
|
|
// Return id for 32-bit unsigned type
|
|
uint32_t GetUintId();
|
|
|
|
// Return id for 64-bit unsigned type
|
|
uint32_t GetUint64Id();
|
|
|
|
// Return id for 8-bit unsigned type
|
|
uint32_t GetUint8Id();
|
|
|
|
// Return id for 32-bit unsigned type
|
|
uint32_t GetBoolId();
|
|
|
|
// Return id for void type
|
|
uint32_t GetVoidId();
|
|
|
|
// Return pointer to type for runtime array of uint
|
|
analysis::Type* GetUintXRuntimeArrayType(uint32_t width,
|
|
analysis::Type** rarr_ty);
|
|
|
|
// Return pointer to type for runtime array of uint
|
|
analysis::Type* GetUintRuntimeArrayType(uint32_t width);
|
|
|
|
// Return id for buffer uint type
|
|
uint32_t GetOutputBufferPtrId();
|
|
|
|
// Return id for buffer uint type
|
|
uint32_t GetInputBufferTypeId();
|
|
|
|
// Return id for buffer uint type
|
|
uint32_t GetInputBufferPtrId();
|
|
|
|
// Return binding for output buffer for current validation.
|
|
uint32_t GetOutputBufferBinding();
|
|
|
|
// Return binding for input buffer for current validation.
|
|
uint32_t GetInputBufferBinding();
|
|
|
|
// Add storage buffer extension if needed
|
|
void AddStorageBufferExt();
|
|
|
|
// Return id for debug output buffer
|
|
uint32_t GetOutputBufferId();
|
|
|
|
// Return id for debug input buffer
|
|
uint32_t GetInputBufferId();
|
|
|
|
// Return id for 32-bit float type
|
|
uint32_t GetFloatId();
|
|
|
|
// Return id for v4float type
|
|
uint32_t GetVec4FloatId();
|
|
|
|
// Return id for uint vector type of |length|
|
|
uint32_t GetVecUintId(uint32_t length);
|
|
|
|
// Return id for v4uint type
|
|
uint32_t GetVec4UintId();
|
|
|
|
// Return id for v3uint type
|
|
uint32_t GetVec3UintId();
|
|
|
|
// Return id for output function. Define if it doesn't exist with
|
|
// |val_spec_param_cnt| validation-specific uint32 parameters.
|
|
uint32_t GetStreamWriteFunctionId(uint32_t stage_idx,
|
|
uint32_t val_spec_param_cnt);
|
|
|
|
// Return id for input function taking |param_cnt| uint32 parameters. Define
|
|
// if it doesn't exist.
|
|
uint32_t GetDirectReadFunctionId(uint32_t param_cnt);
|
|
|
|
// Split block |block_itr| into two new blocks where the second block
|
|
// contains |inst_itr| and place in |new_blocks|.
|
|
void SplitBlock(BasicBlock::iterator inst_itr,
|
|
UptrVectorIterator<BasicBlock> block_itr,
|
|
std::vector<std::unique_ptr<BasicBlock>>* new_blocks);
|
|
|
|
// Apply instrumentation function |pfn| to every instruction in |func|.
|
|
// If code is generated for an instruction, replace the instruction's
|
|
// block with the new blocks that are generated. Continue processing at the
|
|
// top of the last new block.
|
|
bool InstrumentFunction(Function* func, uint32_t stage_idx,
|
|
InstProcessFunction& pfn);
|
|
|
|
// Call |pfn| on all functions in the call tree of the function
|
|
// ids in |roots|.
|
|
bool InstProcessCallTreeFromRoots(InstProcessFunction& pfn,
|
|
std::queue<uint32_t>* roots,
|
|
uint32_t stage_idx);
|
|
|
|
// Gen code into |builder| to write |field_value_id| into debug output
|
|
// buffer at |base_offset_id| + |field_offset|.
|
|
void GenDebugOutputFieldCode(uint32_t base_offset_id, uint32_t field_offset,
|
|
uint32_t field_value_id,
|
|
InstructionBuilder* builder);
|
|
|
|
// Generate instructions into |builder| which will write the members
|
|
// of the debug output record common for all stages and validations at
|
|
// |base_off|.
|
|
void GenCommonStreamWriteCode(uint32_t record_sz, uint32_t instruction_idx,
|
|
uint32_t stage_idx, uint32_t base_off,
|
|
InstructionBuilder* builder);
|
|
|
|
// Generate instructions into |builder| which will write
|
|
// |uint_frag_coord_id| at |component| of the record at |base_offset_id| of
|
|
// the debug output buffer .
|
|
void GenFragCoordEltDebugOutputCode(uint32_t base_offset_id,
|
|
uint32_t uint_frag_coord_id,
|
|
uint32_t component,
|
|
InstructionBuilder* builder);
|
|
|
|
// Generate instructions into |builder| which will load |var_id| and return
|
|
// its result id.
|
|
uint32_t GenVarLoad(uint32_t var_id, InstructionBuilder* builder);
|
|
|
|
// Generate instructions into |builder| which will load the uint |builtin_id|
|
|
// and write it into the debug output buffer at |base_off| + |builtin_off|.
|
|
void GenBuiltinOutputCode(uint32_t builtin_id, uint32_t builtin_off,
|
|
uint32_t base_off, InstructionBuilder* builder);
|
|
|
|
// Generate instructions into |builder| which will write the |stage_idx|-
|
|
// specific members of the debug output stream at |base_off|.
|
|
void GenStageStreamWriteCode(uint32_t stage_idx, uint32_t base_off,
|
|
InstructionBuilder* builder);
|
|
|
|
// Return true if instruction must be in the same block that its result
|
|
// is used.
|
|
bool IsSameBlockOp(const Instruction* inst) const;
|
|
|
|
// Clone operands which must be in same block as consumer instructions.
|
|
// Look in same_blk_pre for instructions that need cloning. Look in
|
|
// same_blk_post for instructions already cloned. Add cloned instruction
|
|
// to same_blk_post.
|
|
void CloneSameBlockOps(
|
|
std::unique_ptr<Instruction>* inst,
|
|
std::unordered_map<uint32_t, uint32_t>* same_blk_post,
|
|
std::unordered_map<uint32_t, Instruction*>* same_blk_pre,
|
|
BasicBlock* block_ptr);
|
|
|
|
// Update phis in succeeding blocks to point to new last block
|
|
void UpdateSucceedingPhis(
|
|
std::vector<std::unique_ptr<BasicBlock>>& new_blocks);
|
|
|
|
// Debug descriptor set index
|
|
uint32_t desc_set_;
|
|
|
|
// Shader module ID written into output record
|
|
uint32_t shader_id_;
|
|
|
|
// Map from function id to function pointer.
|
|
std::unordered_map<uint32_t, Function*> id2function_;
|
|
|
|
// Map from block's label id to block. TODO(dnovillo): This is superfluous wrt
|
|
// CFG. It has functionality not present in CFG. Consolidate.
|
|
std::unordered_map<uint32_t, BasicBlock*> id2block_;
|
|
|
|
// Map from instruction's unique id to offset in original file.
|
|
std::unordered_map<uint32_t, uint32_t> uid2offset_;
|
|
|
|
// result id for OpConstantFalse
|
|
uint32_t validation_id_;
|
|
|
|
// id for output buffer variable
|
|
uint32_t output_buffer_id_;
|
|
|
|
// ptr type id for output buffer element
|
|
uint32_t output_buffer_ptr_id_;
|
|
|
|
// ptr type id for input buffer element
|
|
uint32_t input_buffer_ptr_id_;
|
|
|
|
// id for debug output function
|
|
std::unordered_map<uint32_t, uint32_t> param2output_func_id_;
|
|
|
|
// ids for debug input functions
|
|
std::unordered_map<uint32_t, uint32_t> param2input_func_id_;
|
|
|
|
// id for input buffer variable
|
|
uint32_t input_buffer_id_;
|
|
|
|
// id for 32-bit float type
|
|
uint32_t float_id_;
|
|
|
|
// id for v4float type
|
|
uint32_t v4float_id_;
|
|
|
|
// id for v4uint type
|
|
uint32_t v4uint_id_;
|
|
|
|
// id for v3uint type
|
|
uint32_t v3uint_id_;
|
|
|
|
// id for 32-bit unsigned type
|
|
uint32_t uint_id_;
|
|
|
|
// id for 64-bit unsigned type
|
|
uint32_t uint64_id_;
|
|
|
|
// id for 8-bit unsigned type
|
|
uint32_t uint8_id_;
|
|
|
|
// id for bool type
|
|
uint32_t bool_id_;
|
|
|
|
// id for void type
|
|
uint32_t void_id_;
|
|
|
|
// boolean to remember storage buffer extension
|
|
bool storage_buffer_ext_defined_;
|
|
|
|
// runtime array of uint type
|
|
analysis::Type* uint64_rarr_ty_;
|
|
|
|
// runtime array of uint type
|
|
analysis::Type* uint32_rarr_ty_;
|
|
|
|
// Pre-instrumentation same-block insts
|
|
std::unordered_map<uint32_t, Instruction*> same_block_pre_;
|
|
|
|
// Post-instrumentation same-block op ids
|
|
std::unordered_map<uint32_t, uint32_t> same_block_post_;
|
|
|
|
// Map function calls to result id. Clear for every function.
|
|
// This is for debug input reads with constant arguments that
|
|
// have been generated into the first block of the function.
|
|
// This mechanism is used to avoid multiple identical debug
|
|
// input buffer reads.
|
|
struct vector_hash_ {
|
|
std::size_t operator()(const std::vector<uint32_t>& v) const {
|
|
std::size_t hash = v.size();
|
|
for (auto& u : v) {
|
|
hash ^= u + 0x9e3779b9 + (hash << 11) + (hash >> 21);
|
|
}
|
|
return hash;
|
|
}
|
|
};
|
|
std::unordered_map<std::vector<uint32_t>, uint32_t, vector_hash_> call2id_;
|
|
|
|
// Function currently being instrumented
|
|
Function* curr_func_;
|
|
|
|
// Optimize direct debug input buffer reads. Specifically, move all such
|
|
// reads with constant args to first block and reuse them.
|
|
bool opt_direct_reads_;
|
|
};
|
|
|
|
} // namespace opt
|
|
} // namespace spvtools
|
|
|
|
#endif // LIBSPIRV_OPT_INSTRUMENT_PASS_H_
|