mirror of
https://github.com/KhronosGroup/SPIRV-Tools
synced 2024-11-29 22:41:03 +00:00
1bc0e6f59a
Add a new legalization pass to dedupe invocation interlock instructions DXC will be adding support for HLSL's rasterizer ordered views by using the SPV_EXT_fragment_shader_interlock_extension. That extension stipulates that if an entry point has an interlock ordering execution mode, it must dynamically execute OpBeginInvocationInterlockEXT and OpEndInvocationInterlockEXT, in that order, exactly once. This would be difficult to determine in DXC's SPIR-V backend, so instead we will emit these instructions potentially multiple times, and use this legalization pass to ensure that the final SPIR-V follows the specification. This PR uses data-flow analysis to determine where to place begin and end instructions; in essence, determining whether a block contains or is preceded by a begin instruction is similar to a specialized case of a reaching definitions analysis, where we have only a single definition, such as `bool has_begun = false`. For this simpler case, we can compute the set of blocks using BFS to determine the reachability of the begin instruction. We need to do this for both begin and end instructions, so I have generalized portions of the code to run both forward and backward over the CFG for each respective case.
290 lines
7.5 KiB
CMake
290 lines
7.5 KiB
CMake
# Copyright (c) 2016 Google Inc.
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
set(SPIRV_TOOLS_OPT_SOURCES
|
|
fix_func_call_arguments.h
|
|
aggressive_dead_code_elim_pass.h
|
|
amd_ext_to_khr.h
|
|
analyze_live_input_pass.h
|
|
basic_block.h
|
|
block_merge_pass.h
|
|
block_merge_util.h
|
|
build_module.h
|
|
ccp_pass.h
|
|
cfg_cleanup_pass.h
|
|
cfg.h
|
|
code_sink.h
|
|
combine_access_chains.h
|
|
compact_ids_pass.h
|
|
composite.h
|
|
const_folding_rules.h
|
|
constants.h
|
|
control_dependence.h
|
|
convert_to_sampled_image_pass.h
|
|
convert_to_half_pass.h
|
|
copy_prop_arrays.h
|
|
dataflow.h
|
|
dead_branch_elim_pass.h
|
|
dead_insert_elim_pass.h
|
|
dead_variable_elimination.h
|
|
decoration_manager.h
|
|
debug_info_manager.h
|
|
def_use_manager.h
|
|
desc_sroa.h
|
|
desc_sroa_util.h
|
|
dominator_analysis.h
|
|
dominator_tree.h
|
|
eliminate_dead_constant_pass.h
|
|
eliminate_dead_functions_pass.h
|
|
eliminate_dead_functions_util.h
|
|
eliminate_dead_io_components_pass.h
|
|
eliminate_dead_members_pass.h
|
|
eliminate_dead_output_stores_pass.h
|
|
empty_pass.h
|
|
feature_manager.h
|
|
fix_storage_class.h
|
|
flatten_decoration_pass.h
|
|
fold.h
|
|
folding_rules.h
|
|
fold_spec_constant_op_and_composite_pass.h
|
|
freeze_spec_constant_value_pass.h
|
|
function.h
|
|
graphics_robust_access_pass.h
|
|
if_conversion.h
|
|
inline_exhaustive_pass.h
|
|
inline_opaque_pass.h
|
|
inline_pass.h
|
|
inst_bindless_check_pass.h
|
|
inst_buff_addr_check_pass.h
|
|
inst_debug_printf_pass.h
|
|
instruction.h
|
|
instruction_list.h
|
|
instrument_pass.h
|
|
interface_var_sroa.h
|
|
invocation_interlock_placement_pass.h
|
|
interp_fixup_pass.h
|
|
ir_builder.h
|
|
ir_context.h
|
|
ir_loader.h
|
|
licm_pass.h
|
|
liveness.h
|
|
local_access_chain_convert_pass.h
|
|
local_redundancy_elimination.h
|
|
local_single_block_elim_pass.h
|
|
local_single_store_elim_pass.h
|
|
log.h
|
|
loop_dependence.h
|
|
loop_descriptor.h
|
|
loop_fission.h
|
|
loop_fusion.h
|
|
loop_fusion_pass.h
|
|
loop_peeling.h
|
|
loop_unroller.h
|
|
loop_utils.h
|
|
loop_unswitch_pass.h
|
|
mem_pass.h
|
|
merge_return_pass.h
|
|
module.h
|
|
null_pass.h
|
|
passes.h
|
|
pass.h
|
|
pass_manager.h
|
|
private_to_local_pass.h
|
|
propagator.h
|
|
reduce_load_size.h
|
|
redundancy_elimination.h
|
|
reflect.h
|
|
register_pressure.h
|
|
relax_float_ops_pass.h
|
|
remove_dontinline_pass.h
|
|
remove_duplicates_pass.h
|
|
remove_unused_interface_variables_pass.h
|
|
replace_desc_array_access_using_var_index.h
|
|
replace_invalid_opc.h
|
|
scalar_analysis.h
|
|
scalar_analysis_nodes.h
|
|
scalar_replacement_pass.h
|
|
set_spec_constant_default_value_pass.h
|
|
simplification_pass.h
|
|
spread_volatile_semantics.h
|
|
ssa_rewrite_pass.h
|
|
strength_reduction_pass.h
|
|
strip_debug_info_pass.h
|
|
strip_nonsemantic_info_pass.h
|
|
struct_cfg_analysis.h
|
|
switch_descriptorset_pass.h
|
|
tree_iterator.h
|
|
trim_capabilities_pass.h
|
|
type_manager.h
|
|
types.h
|
|
unify_const_pass.h
|
|
upgrade_memory_model.h
|
|
value_number_table.h
|
|
vector_dce.h
|
|
workaround1209.h
|
|
wrap_opkill.h
|
|
|
|
fix_func_call_arguments.cpp
|
|
aggressive_dead_code_elim_pass.cpp
|
|
amd_ext_to_khr.cpp
|
|
analyze_live_input_pass.cpp
|
|
basic_block.cpp
|
|
block_merge_pass.cpp
|
|
block_merge_util.cpp
|
|
build_module.cpp
|
|
ccp_pass.cpp
|
|
cfg_cleanup_pass.cpp
|
|
cfg.cpp
|
|
code_sink.cpp
|
|
combine_access_chains.cpp
|
|
compact_ids_pass.cpp
|
|
composite.cpp
|
|
const_folding_rules.cpp
|
|
constants.cpp
|
|
control_dependence.cpp
|
|
convert_to_sampled_image_pass.cpp
|
|
convert_to_half_pass.cpp
|
|
copy_prop_arrays.cpp
|
|
dataflow.cpp
|
|
dead_branch_elim_pass.cpp
|
|
dead_insert_elim_pass.cpp
|
|
dead_variable_elimination.cpp
|
|
decoration_manager.cpp
|
|
debug_info_manager.cpp
|
|
def_use_manager.cpp
|
|
desc_sroa.cpp
|
|
desc_sroa_util.cpp
|
|
dominator_analysis.cpp
|
|
dominator_tree.cpp
|
|
eliminate_dead_constant_pass.cpp
|
|
eliminate_dead_functions_pass.cpp
|
|
eliminate_dead_functions_util.cpp
|
|
eliminate_dead_io_components_pass.cpp
|
|
eliminate_dead_members_pass.cpp
|
|
eliminate_dead_output_stores_pass.cpp
|
|
feature_manager.cpp
|
|
fix_storage_class.cpp
|
|
flatten_decoration_pass.cpp
|
|
fold.cpp
|
|
folding_rules.cpp
|
|
fold_spec_constant_op_and_composite_pass.cpp
|
|
freeze_spec_constant_value_pass.cpp
|
|
function.cpp
|
|
graphics_robust_access_pass.cpp
|
|
if_conversion.cpp
|
|
inline_exhaustive_pass.cpp
|
|
inline_opaque_pass.cpp
|
|
inline_pass.cpp
|
|
inst_bindless_check_pass.cpp
|
|
inst_buff_addr_check_pass.cpp
|
|
inst_debug_printf_pass.cpp
|
|
instruction.cpp
|
|
instruction_list.cpp
|
|
instrument_pass.cpp
|
|
interface_var_sroa.cpp
|
|
invocation_interlock_placement_pass.cpp
|
|
interp_fixup_pass.cpp
|
|
ir_context.cpp
|
|
ir_loader.cpp
|
|
licm_pass.cpp
|
|
liveness.cpp
|
|
local_access_chain_convert_pass.cpp
|
|
local_redundancy_elimination.cpp
|
|
local_single_block_elim_pass.cpp
|
|
local_single_store_elim_pass.cpp
|
|
loop_dependence.cpp
|
|
loop_dependence_helpers.cpp
|
|
loop_descriptor.cpp
|
|
loop_fission.cpp
|
|
loop_fusion.cpp
|
|
loop_fusion_pass.cpp
|
|
loop_peeling.cpp
|
|
loop_utils.cpp
|
|
loop_unroller.cpp
|
|
loop_unswitch_pass.cpp
|
|
mem_pass.cpp
|
|
merge_return_pass.cpp
|
|
module.cpp
|
|
optimizer.cpp
|
|
pass.cpp
|
|
pass_manager.cpp
|
|
private_to_local_pass.cpp
|
|
propagator.cpp
|
|
reduce_load_size.cpp
|
|
redundancy_elimination.cpp
|
|
register_pressure.cpp
|
|
relax_float_ops_pass.cpp
|
|
remove_dontinline_pass.cpp
|
|
remove_duplicates_pass.cpp
|
|
remove_unused_interface_variables_pass.cpp
|
|
replace_desc_array_access_using_var_index.cpp
|
|
replace_invalid_opc.cpp
|
|
scalar_analysis.cpp
|
|
scalar_analysis_simplification.cpp
|
|
scalar_replacement_pass.cpp
|
|
set_spec_constant_default_value_pass.cpp
|
|
simplification_pass.cpp
|
|
spread_volatile_semantics.cpp
|
|
ssa_rewrite_pass.cpp
|
|
strength_reduction_pass.cpp
|
|
strip_debug_info_pass.cpp
|
|
strip_nonsemantic_info_pass.cpp
|
|
struct_cfg_analysis.cpp
|
|
switch_descriptorset_pass.cpp
|
|
trim_capabilities_pass.cpp
|
|
type_manager.cpp
|
|
types.cpp
|
|
unify_const_pass.cpp
|
|
upgrade_memory_model.cpp
|
|
value_number_table.cpp
|
|
vector_dce.cpp
|
|
workaround1209.cpp
|
|
wrap_opkill.cpp
|
|
)
|
|
|
|
if(MSVC AND (NOT ("${CMAKE_CXX_COMPILER_ID}" MATCHES "Clang")))
|
|
# Enable parallel builds across four cores for this lib
|
|
add_definitions(/MP4)
|
|
endif()
|
|
|
|
spvtools_pch(SPIRV_TOOLS_OPT_SOURCES pch_source_opt)
|
|
|
|
add_library(SPIRV-Tools-opt ${SPIRV_TOOLS_LIBRARY_TYPE} ${SPIRV_TOOLS_OPT_SOURCES})
|
|
|
|
spvtools_default_compile_options(SPIRV-Tools-opt)
|
|
target_include_directories(SPIRV-Tools-opt
|
|
PUBLIC
|
|
$<BUILD_INTERFACE:${spirv-tools_SOURCE_DIR}/include>
|
|
$<BUILD_INTERFACE:${SPIRV_HEADER_INCLUDE_DIR}>
|
|
$<INSTALL_INTERFACE:${CMAKE_INSTALL_INCLUDEDIR}>
|
|
PRIVATE ${spirv-tools_BINARY_DIR}
|
|
)
|
|
# We need the assembling and disassembling functionalities in the main library.
|
|
target_link_libraries(SPIRV-Tools-opt
|
|
PUBLIC ${SPIRV_TOOLS_FULL_VISIBILITY})
|
|
|
|
set_property(TARGET SPIRV-Tools-opt PROPERTY FOLDER "SPIRV-Tools libraries")
|
|
spvtools_check_symbol_exports(SPIRV-Tools-opt)
|
|
|
|
if(ENABLE_SPIRV_TOOLS_INSTALL)
|
|
install(TARGETS SPIRV-Tools-opt EXPORT SPIRV-Tools-optTargets)
|
|
export(EXPORT SPIRV-Tools-optTargets FILE SPIRV-Tools-optTargets.cmake)
|
|
|
|
spvtools_config_package_dir(SPIRV-Tools-opt PACKAGE_DIR)
|
|
install(EXPORT SPIRV-Tools-optTargets FILE SPIRV-Tools-optTargets.cmake
|
|
DESTINATION ${PACKAGE_DIR})
|
|
|
|
spvtools_generate_config_file(SPIRV-Tools-opt)
|
|
install(FILES ${CMAKE_BINARY_DIR}/SPIRV-Tools-optConfig.cmake DESTINATION ${PACKAGE_DIR})
|
|
endif(ENABLE_SPIRV_TOOLS_INSTALL)
|