/************************************************************************** * * Copyright 2011-2012 Advanced Micro Devices, Inc. * Copyright 2009 VMware, Inc. * All Rights Reserved. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the * "Software"), to deal in the Software without restriction, including * without limitation the rights to use, copy, modify, merge, publish, * distribute, sub license, and/or sell copies of the Software, and to * permit persons to whom the Software is furnished to do so, subject to * the following conditions: * * The above copyright notice and this permission notice (including the * next paragraph) shall be included in all copies or substantial portions * of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. * **************************************************************************/ /** * @file * TGSI to LLVM IR translation. * * @author Jose Fonseca * @author Tom Stellard */ #ifndef LP_BLD_TGSI_H #define LP_BLD_TGSI_H #include "gallivm/lp_bld.h" #include "gallivm/lp_bld_tgsi_action.h" #include "gallivm/lp_bld_limits.h" #include "gallivm/lp_bld_sample.h" #include "gallivm/lp_bld_ir_common.h" #include "lp_bld_type.h" #include "pipe/p_compiler.h" #include "pipe/p_state.h" #include "tgsi/tgsi_exec.h" #include "tgsi/tgsi_scan.h" #include "tgsi/tgsi_info.h" #ifdef __cplusplus extern "C" { #endif #define LP_CHAN_ALL ~0u #define LP_MAX_INSTRUCTIONS 256 struct tgsi_full_declaration; struct tgsi_full_immediate; struct tgsi_full_instruction; struct tgsi_full_src_register; struct tgsi_full_dst_register; struct tgsi_opcode_info; struct tgsi_token; struct tgsi_shader_info; struct lp_build_mask_context; struct gallivm_state; struct lp_derivatives; struct lp_build_gs_iface; enum lp_build_tex_modifier { LP_BLD_TEX_MODIFIER_NONE = 0, LP_BLD_TEX_MODIFIER_PROJECTED, LP_BLD_TEX_MODIFIER_LOD_BIAS, LP_BLD_TEX_MODIFIER_EXPLICIT_LOD, LP_BLD_TEX_MODIFIER_EXPLICIT_DERIV, LP_BLD_TEX_MODIFIER_LOD_ZERO }; /** * Describe a channel of a register. * * The value can be a: * - immediate value (i.e. derived from a IMM register) * - CONST[n].x/y/z/w * - IN[n].x/y/z/w * - undetermined (when .file == TGSI_FILE_NULL) * * This is one of the analysis results, and is used to described * the output color in terms of inputs. */ struct lp_tgsi_channel_info { unsigned file:4; /* TGSI_FILE_* */ unsigned swizzle:3; /* PIPE_SWIZZLE_x */ union { uint32_t index; float value; /* for TGSI_FILE_IMMEDIATE */ } u; }; /** * Describe a texture sampler interpolator. * * The interpolation is described in terms of regular inputs. */ struct lp_tgsi_texture_info { struct lp_tgsi_channel_info coord[4]; unsigned target:8; /* TGSI_TEXTURE_* */ unsigned sampler_unit:8; /* Sampler unit */ unsigned texture_unit:8; /* Texture unit */ unsigned modifier:8; /* LP_BLD_TEX_MODIFIER_* */ }; struct lp_tgsi_info { struct tgsi_shader_info base; /* * Whether any of the texture opcodes access a register file other than * TGSI_FILE_INPUT. * * We could also handle TGSI_FILE_CONST/IMMEDIATE here, but there is little * benefit. */ unsigned indirect_textures:1; /* * Whether any of the texture (sample) ocpodes use different sampler * and sampler view unit. */ unsigned sampler_texture_units_different:1; /* * Whether any immediate values are outside the range of 0 and 1 */ unsigned unclamped_immediates:1; /* * Texture opcode description. Aimed at detecting and described direct * texture opcodes. */ unsigned num_texs; struct lp_tgsi_texture_info tex[PIPE_MAX_SAMPLERS]; /* * Output description. Aimed at detecting and describing simple blit * shaders. */ struct lp_tgsi_channel_info output[PIPE_MAX_SHADER_OUTPUTS][4]; /* * Shortcut pointers into the above (for fragment shaders). */ const struct lp_tgsi_channel_info *cbuf[PIPE_MAX_COLOR_BUFS]; }; /** * Reference to system values. */ struct lp_bld_tgsi_system_values { LLVMValueRef instance_id; LLVMValueRef base_instance; LLVMValueRef vertex_id; LLVMValueRef vertex_id_nobase; LLVMValueRef prim_id; LLVMValueRef basevertex; LLVMValueRef firstvertex; LLVMValueRef invocation_id; LLVMValueRef draw_id; LLVMValueRef thread_id; LLVMValueRef block_id; LLVMValueRef grid_size; LLVMValueRef front_facing; LLVMValueRef work_dim; LLVMValueRef block_size; LLVMValueRef tess_coord; LLVMValueRef tess_outer; LLVMValueRef tess_inner; LLVMValueRef vertices_in; LLVMValueRef sample_id; LLVMValueRef sample_pos; LLVMValueRef sample_mask_in; LLVMValueRef view_index; LLVMValueRef subgroup_id; LLVMValueRef num_subgroups; }; /** * Sampler code generation interface. * * Although texture sampling is a requirement for TGSI translation, it is * a very different problem with several different approaches to it. This * structure establishes an interface for texture sampling code generation, so * that we can easily use different texture sampling strategies. */ struct lp_build_sampler_soa { void (*destroy)( struct lp_build_sampler_soa *sampler ); void (*emit_tex_sample)(const struct lp_build_sampler_soa *sampler, struct gallivm_state *gallivm, const struct lp_sampler_params *params); void (*emit_size_query)( const struct lp_build_sampler_soa *sampler, struct gallivm_state *gallivm, const struct lp_sampler_size_query_params *params); }; struct lp_build_sampler_aos { LLVMValueRef (*emit_fetch_texel)( const struct lp_build_sampler_aos *sampler, struct lp_build_context *bld, unsigned target, /* TGSI_TEXTURE_* */ unsigned unit, LLVMValueRef coords, const struct lp_derivatives derivs, enum lp_build_tex_modifier modifier); }; struct lp_img_params; struct lp_build_image_soa { void (*destroy)( struct lp_build_image_soa *image ); void (*emit_op)(const struct lp_build_image_soa *image, struct gallivm_state *gallivm, const struct lp_img_params *params); void (*emit_size_query)( const struct lp_build_image_soa *sampler, struct gallivm_state *gallivm, const struct lp_sampler_size_query_params *params); }; struct lp_build_fs_iface; struct lp_build_fs_iface { LLVMValueRef (*interp_fn)(const struct lp_build_fs_iface *iface, struct lp_build_context *bld, unsigned attrib, unsigned chan, bool centroid, bool sample, LLVMValueRef indir_index, LLVMValueRef offsets[2]); void (*fb_fetch)(const struct lp_build_fs_iface *iface, struct lp_build_context *bld, unsigned cbuf, LLVMValueRef result[4]); }; void lp_build_tgsi_info(const struct tgsi_token *tokens, struct lp_tgsi_info *info); struct lp_build_tgsi_params { struct lp_type type; struct lp_build_mask_context *mask; LLVMValueRef consts_ptr; LLVMValueRef const_sizes_ptr; const struct lp_bld_tgsi_system_values *system_values; const LLVMValueRef (*inputs)[4]; LLVMValueRef context_ptr; LLVMValueRef thread_data_ptr; const struct lp_build_sampler_soa *sampler; const struct tgsi_shader_info *info; const struct lp_build_gs_iface *gs_iface; const struct lp_build_tcs_iface *tcs_iface; const struct lp_build_tes_iface *tes_iface; LLVMValueRef ssbo_ptr; LLVMValueRef ssbo_sizes_ptr; const struct lp_build_image_soa *image; LLVMValueRef shared_ptr; const struct lp_build_coro_suspend_info *coro; LLVMValueRef kernel_args; const struct lp_build_fs_iface *fs_iface; unsigned gs_vertex_streams; }; void lp_build_tgsi_soa(struct gallivm_state *gallivm, const struct tgsi_token *tokens, const struct lp_build_tgsi_params *params, LLVMValueRef (*outputs)[4]); void lp_build_tgsi_aos(struct gallivm_state *gallivm, const struct tgsi_token *tokens, struct lp_type type, const unsigned char swizzles[4], LLVMValueRef consts_ptr, const LLVMValueRef *inputs, LLVMValueRef *outputs, const struct lp_build_sampler_aos *sampler, const struct tgsi_shader_info *info); struct lp_build_tgsi_inst_list { struct tgsi_full_instruction *instructions; uint max_instructions; uint num_instructions; }; unsigned lp_bld_tgsi_list_init(struct lp_build_tgsi_context * bld_base); unsigned lp_bld_tgsi_add_instruction( struct lp_build_tgsi_context * bld_base, const struct tgsi_full_instruction *inst_to_add); struct lp_build_tgsi_context; typedef LLVMValueRef (*lp_build_emit_fetch_fn)(struct lp_build_tgsi_context *, const struct tgsi_full_src_register *, enum tgsi_opcode_type, unsigned); typedef void (*lp_build_emit_store_reg_fn)(struct lp_build_tgsi_context *, enum tgsi_opcode_type, const struct tgsi_full_dst_register *, unsigned, unsigned, LLVMValueRef, LLVMValueRef); struct lp_build_tgsi_context { struct lp_build_context base; struct lp_build_context uint_bld; struct lp_build_context int_bld; struct lp_build_context dbl_bld; struct lp_build_context uint64_bld; struct lp_build_context int64_bld; /** This array stores functions that are used to transform TGSI opcodes to * LLVM instructions. */ struct lp_build_tgsi_action op_actions[TGSI_OPCODE_LAST]; /* TGSI_OPCODE_RSQ is defined as 1 / sqrt( abs(src0.x) ), rsq_action * should compute 1 / sqrt (src0.x) */ struct lp_build_tgsi_action rsq_action; struct lp_build_tgsi_action sqrt_action; struct lp_build_tgsi_action drsq_action; struct lp_build_tgsi_action dsqrt_action; const struct tgsi_shader_info *info; lp_build_emit_fetch_fn emit_fetch_funcs[TGSI_FILE_COUNT]; lp_build_emit_store_reg_fn emit_store_reg_funcs[TGSI_FILE_COUNT]; LLVMValueRef (*emit_swizzle)(struct lp_build_tgsi_context *, LLVMValueRef, unsigned, unsigned, unsigned, unsigned); void (*emit_debug)(struct lp_build_tgsi_context *, const struct tgsi_full_instruction *, const struct tgsi_opcode_info *); void (*emit_store)(struct lp_build_tgsi_context *, const struct tgsi_full_instruction *, const struct tgsi_opcode_info *, unsigned index, LLVMValueRef dst[4]); void (*emit_declaration)(struct lp_build_tgsi_context *, const struct tgsi_full_declaration *decl); void (*emit_immediate)(struct lp_build_tgsi_context *, const struct tgsi_full_immediate *imm); /* Allow the user to store data in this structure rather than passing it * to every function. */ void * userdata; boolean soa; int pc; struct tgsi_full_instruction *instructions; uint max_instructions; uint num_instructions; /** This function allows the user to insert some instructions at the * beginning of the program. It is optional and does not need to be * implemented. */ void (*emit_prologue)(struct lp_build_tgsi_context*); /** This function allows the user to insert some instructions after * declarations section, but before any other code. * It is optional and does not need to be implemented. */ void (*emit_prologue_post_decl)(struct lp_build_tgsi_context*); /** This function allows the user to insert some instructions at the end of * the program. This callback is intended to be used for emitting * instructions to handle the export for the output registers, but it can * be used for any purpose. Implementing this function is optiona, but * recommended. */ void (*emit_epilogue)(struct lp_build_tgsi_context*); }; struct lp_build_gs_iface { LLVMValueRef (*fetch_input)(const struct lp_build_gs_iface *gs_iface, struct lp_build_context * bld, boolean is_vindex_indirect, LLVMValueRef vertex_index, boolean is_aindex_indirect, LLVMValueRef attrib_index, LLVMValueRef swizzle_index); void (*emit_vertex)(const struct lp_build_gs_iface *gs_iface, struct lp_build_context * bld, LLVMValueRef (*outputs)[4], LLVMValueRef emitted_vertices_vec, LLVMValueRef mask_vec, LLVMValueRef stream_id); void (*end_primitive)(const struct lp_build_gs_iface *gs_iface, struct lp_build_context * bld, LLVMValueRef total_emitted_vertices_vec, LLVMValueRef verts_per_prim_vec, LLVMValueRef emitted_prims_vec, LLVMValueRef mask_vec, unsigned stream); void (*gs_epilogue)(const struct lp_build_gs_iface *gs_iface, LLVMValueRef total_emitted_vertices_vec, LLVMValueRef emitted_prims_vec, unsigned stream); }; struct lp_build_tcs_iface { void (*emit_prologue)(struct lp_build_context * bld); void (*emit_epilogue)(struct lp_build_context * bld); void (*emit_barrier)(struct lp_build_context *bld_base); void (*emit_store_output)(const struct lp_build_tcs_iface *tcs_iface, struct lp_build_context * bld, unsigned name, boolean is_vindex_indirect, LLVMValueRef vertex_index, boolean is_aindex_indirect, LLVMValueRef attrib_index, boolean is_sindex_indirect, LLVMValueRef swizzle_index, LLVMValueRef value, LLVMValueRef mask_vec); LLVMValueRef (*emit_fetch_input)(const struct lp_build_tcs_iface *tcs_iface, struct lp_build_context * bld, boolean is_vindex_indirect, LLVMValueRef vertex_index, boolean is_aindex_indirect, LLVMValueRef attrib_index, boolean is_sindex_indirect, LLVMValueRef swizzle_index); LLVMValueRef (*emit_fetch_output)(const struct lp_build_tcs_iface *tcs_iface, struct lp_build_context * bld, boolean is_vindex_indirect, LLVMValueRef vertex_index, boolean is_aindex_indirect, LLVMValueRef attrib_index, boolean is_sindex_indirect, LLVMValueRef swizzle_index, uint32_t name); }; struct lp_build_tes_iface { LLVMValueRef (*fetch_vertex_input)(const struct lp_build_tes_iface *tes_iface, struct lp_build_context * bld, boolean is_vindex_indirect, LLVMValueRef vertex_index, boolean is_aindex_indirect, LLVMValueRef attrib_index, boolean is_sindex_indirect, LLVMValueRef swizzle_index); LLVMValueRef (*fetch_patch_input)(const struct lp_build_tes_iface *tes_iface, struct lp_build_context * bld, boolean is_aindex_indirect, LLVMValueRef attrib_index, LLVMValueRef swizzle_index); }; struct lp_build_tgsi_soa_context { struct lp_build_tgsi_context bld_base; /* Builder for scalar elements of shader's data type (float) */ struct lp_build_context elem_bld; const struct lp_build_gs_iface *gs_iface; const struct lp_build_tcs_iface *tcs_iface; const struct lp_build_tes_iface *tes_iface; LLVMValueRef emitted_prims_vec_ptr; LLVMValueRef total_emitted_vertices_vec_ptr; LLVMValueRef emitted_vertices_vec_ptr; LLVMValueRef max_output_vertices_vec; LLVMValueRef consts_ptr; LLVMValueRef const_sizes_ptr; LLVMValueRef consts[LP_MAX_TGSI_CONST_BUFFERS]; LLVMValueRef consts_sizes[LP_MAX_TGSI_CONST_BUFFERS]; const LLVMValueRef (*inputs)[TGSI_NUM_CHANNELS]; LLVMValueRef (*outputs)[TGSI_NUM_CHANNELS]; LLVMValueRef context_ptr; LLVMValueRef thread_data_ptr; LLVMValueRef ssbo_ptr; LLVMValueRef ssbo_sizes_ptr; LLVMValueRef ssbos[LP_MAX_TGSI_SHADER_BUFFERS]; LLVMValueRef ssbo_sizes[LP_MAX_TGSI_SHADER_BUFFERS]; LLVMValueRef shared_ptr; const struct lp_build_coro_suspend_info *coro; const struct lp_build_sampler_soa *sampler; const struct lp_build_image_soa *image; struct tgsi_declaration_sampler_view sv[PIPE_MAX_SHADER_SAMPLER_VIEWS]; LLVMValueRef immediates[LP_MAX_INLINED_IMMEDIATES][TGSI_NUM_CHANNELS]; LLVMValueRef temps[LP_MAX_INLINED_TEMPS][TGSI_NUM_CHANNELS]; LLVMValueRef addr[LP_MAX_TGSI_ADDRS][TGSI_NUM_CHANNELS]; /* We allocate/use this array of temps if (1 << TGSI_FILE_TEMPORARY) is * set in the indirect_files field. * The temps[] array above is unused then. */ LLVMValueRef temps_array; /* We allocate/use this array of output if (1 << TGSI_FILE_OUTPUT) is * set in the indirect_files field. * The outputs[] array above is unused then. */ LLVMValueRef outputs_array; /* We allocate/use this array of inputs if (1 << TGSI_FILE_INPUT) is * set in the indirect_files field. * The inputs[] array above is unused then. */ LLVMValueRef inputs_array; /* We allocate/use this array of temps if (1 << TGSI_FILE_IMMEDIATE) is * set in the indirect_files field. */ LLVMValueRef imms_array; struct lp_bld_tgsi_system_values system_values; /** bitmask indicating which register files are accessed indirectly */ unsigned indirect_files; struct lp_build_mask_context *mask; struct lp_exec_mask exec_mask; uint num_immediates; boolean use_immediates_array; }; void lp_emit_declaration_soa( struct lp_build_tgsi_context *bld, const struct tgsi_full_declaration *decl); void lp_emit_immediate_soa( struct lp_build_tgsi_context *bld_base, const struct tgsi_full_immediate *imm); boolean lp_emit_instruction_soa( struct lp_build_tgsi_soa_context *bld, const struct tgsi_full_instruction *inst, const struct tgsi_opcode_info *info); LLVMValueRef lp_get_temp_ptr_soa( struct lp_build_tgsi_soa_context *bld, unsigned index, unsigned chan); LLVMValueRef lp_get_output_ptr( struct lp_build_tgsi_soa_context *bld, unsigned index, unsigned chan); struct lp_build_tgsi_aos_context { struct lp_build_tgsi_context bld_base; /* Builder for integer masks and indices */ struct lp_build_context int_bld; /* * AoS swizzle used: * - swizzles[0] = red index * - swizzles[1] = green index * - swizzles[2] = blue index * - swizzles[3] = alpha index */ unsigned char swizzles[4]; unsigned char inv_swizzles[4]; LLVMValueRef consts_ptr; const LLVMValueRef *inputs; LLVMValueRef *outputs; const struct lp_build_sampler_aos *sampler; struct tgsi_declaration_sampler_view sv[PIPE_MAX_SHADER_SAMPLER_VIEWS]; LLVMValueRef immediates[LP_MAX_INLINED_IMMEDIATES]; LLVMValueRef temps[LP_MAX_INLINED_TEMPS]; LLVMValueRef addr[LP_MAX_TGSI_ADDRS]; /* We allocate/use this array of temps if (1 << TGSI_FILE_TEMPORARY) is * set in the indirect_files field. * The temps[] array above is unused then. */ LLVMValueRef temps_array; /** bitmask indicating which register files are accessed indirectly */ unsigned indirect_files; }; static inline struct lp_build_tgsi_soa_context * lp_soa_context(struct lp_build_tgsi_context *bld_base) { return (struct lp_build_tgsi_soa_context *)bld_base; } static inline struct lp_build_tgsi_aos_context * lp_aos_context(struct lp_build_tgsi_context *bld_base) { return (struct lp_build_tgsi_aos_context *)bld_base; } void lp_emit_declaration_aos( struct lp_build_tgsi_aos_context *bld, const struct tgsi_full_declaration *decl); boolean lp_emit_instruction_aos( struct lp_build_tgsi_aos_context *bld, const struct tgsi_full_instruction *inst, const struct tgsi_opcode_info *info, int *pc); void lp_emit_store_aos( struct lp_build_tgsi_aos_context *bld, const struct tgsi_full_instruction *inst, unsigned index, LLVMValueRef value); void lp_build_fetch_args( struct lp_build_tgsi_context * bld_base, struct lp_build_emit_data * emit_data); LLVMValueRef lp_build_tgsi_inst_llvm_aos( struct lp_build_tgsi_context * bld_base, const struct tgsi_full_instruction *inst); void lp_build_tgsi_intrinsic( const struct lp_build_tgsi_action * action, struct lp_build_tgsi_context * bld_base, struct lp_build_emit_data * emit_data); LLVMValueRef lp_build_emit_llvm( struct lp_build_tgsi_context *bld_base, unsigned tgsi_opcode, struct lp_build_emit_data * emit_data); LLVMValueRef lp_build_emit_llvm_unary( struct lp_build_tgsi_context *bld_base, unsigned tgsi_opcode, LLVMValueRef arg0); LLVMValueRef lp_build_emit_llvm_binary( struct lp_build_tgsi_context *bld_base, unsigned tgsi_opcode, LLVMValueRef arg0, LLVMValueRef arg1); LLVMValueRef lp_build_emit_llvm_ternary( struct lp_build_tgsi_context *bld_base, unsigned tgsi_opcode, LLVMValueRef arg0, LLVMValueRef arg1, LLVMValueRef arg2); boolean lp_build_tgsi_inst_llvm( struct lp_build_tgsi_context * bld_base, const struct tgsi_full_instruction *inst); LLVMValueRef lp_build_emit_fetch_src( struct lp_build_tgsi_context *bld_base, const struct tgsi_full_src_register *reg, enum tgsi_opcode_type stype, const unsigned chan_index); LLVMValueRef lp_build_emit_fetch( struct lp_build_tgsi_context *bld_base, const struct tgsi_full_instruction *inst, unsigned src_op, const unsigned chan_index); LLVMValueRef lp_build_emit_fetch_texoffset( struct lp_build_tgsi_context *bld_base, const struct tgsi_full_instruction *inst, unsigned tex_off_op, const unsigned chan_index); boolean lp_build_tgsi_llvm( struct lp_build_tgsi_context * bld_base, const struct tgsi_token *tokens); #ifdef __cplusplus } #endif #endif /* LP_BLD_TGSI_H */