/**************************************************************************
 *
 * Copyright 2003 VMware, Inc.
 * All Rights Reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sub license, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 *
 **************************************************************************/

/* Include guard; the matching #endif closes the file. */
#ifndef I915_FPC_H
#define I915_FPC_H

#include "i915_context.h"
#include "i915_reg.h"

#include "pipe/p_shader_tokens.h"

#include "tgsi/tgsi_parse.h"

/* Number of uint slots in each of the declarations[] and program[]
 * arrays of struct i915_fp_compile.
 */
#define I915_PROGRAM_SIZE 192

/* Use these indices for pos/face routing; they must be >= the number of
 * inputs.
 */
#define I915_SEMANTIC_POS 100
#define I915_SEMANTIC_FACE 101

/**
|
* Program translation state
|
*/
|
struct i915_fp_compile {
|
struct i915_fragment_shader *shader; /* the shader we're compiling */
|
|
boolean used_constants[I915_MAX_CONSTANT];
|
|
/** maps TGSI immediate index to constant slot */
|
uint num_immediates;
|
uint immediates_map[I915_MAX_CONSTANT];
|
float immediates[I915_MAX_CONSTANT][4];
|
|
boolean first_instruction;
|
|
uint declarations[I915_PROGRAM_SIZE];
|
uint program[I915_PROGRAM_SIZE];
|
|
uint *csr; /**< Cursor, points into program. */
|
|
uint *decl; /**< Cursor, points into declarations. */
|
|
uint decl_s; /**< flags for which s regs need to be decl'd */
|
uint decl_t; /**< flags for which t regs need to be decl'd */
|
|
uint temp_flag; /**< Tracks temporary regs which are in use */
|
uint utemp_flag; /**< Tracks TYPE_U temporary regs which are in use */
|
|
uint register_phases[I915_MAX_TEMPORARY];
|
uint nr_tex_indirect;
|
uint nr_tex_insn;
|
uint nr_alu_insn;
|
uint nr_decl_insn;
|
|
boolean error; /**< Set if i915_program_error() is called */
|
uint NumNativeInstructions;
|
uint NumNativeAluInstructions;
|
uint NumNativeTexInstructions;
|
uint NumNativeTexIndirections;
|
};
|
|
|
/* Bit layout of a "ureg" (the 32-bit register handle used by the
 * compiler).  Having zero and one in here makes the definition of swizzle
 * a lot easier.
 *
 * Going by the shift values below: the register type starts at bit 29 and
 * the register number at bit 24.  Each of the X/Y/Z/W channels owns a
 * 4-bit slot (selector in the low three bits, negate flag in the top bit)
 * at bits 20, 16, 12 and 8.  Two further selector slots, for the ZERO and
 * ONE sources, start at bits 4 and 0.
 *
 * NOTE(review): the *_NEGATE_MBZ values (5 and 1) do not follow the
 * "shift + 3" pattern of the X..W negate bits; presumably MBZ stands for
 * "must be zero" -- confirm before relying on them.
 */
#define UREG_TYPE_SHIFT               29
#define UREG_NR_SHIFT                 24
#define UREG_CHANNEL_X_NEGATE_SHIFT   23
#define UREG_CHANNEL_X_SHIFT          20
#define UREG_CHANNEL_Y_NEGATE_SHIFT   19
#define UREG_CHANNEL_Y_SHIFT          16
#define UREG_CHANNEL_Z_NEGATE_SHIFT   15
#define UREG_CHANNEL_Z_SHIFT          12
#define UREG_CHANNEL_W_NEGATE_SHIFT   11
#define UREG_CHANNEL_W_SHIFT          8
#define UREG_CHANNEL_ZERO_NEGATE_MBZ  5
#define UREG_CHANNEL_ZERO_SHIFT       4
#define UREG_CHANNEL_ONE_NEGATE_MBZ   1
#define UREG_CHANNEL_ONE_SHIFT        0

#define UREG_BAD          0xffffffff /* not a valid ureg */

/* Short aliases for the SRC_* channel selectors.  These are very short
 * macro names, so they rewrite any identifier X, Y, Z, W, ZERO or ONE in
 * code that includes this header.
 */
#define X    SRC_X
#define Y    SRC_Y
#define Z    SRC_Z
#define W    SRC_W
#define ZERO SRC_ZERO
#define ONE  SRC_ONE

/* Construct a ureg:
 *
 * Packs the register type and number into their fields and fills the
 * channel slots with the identity selection (X in the X slot, Y in the Y
 * slot, ...), plus the ZERO and ONE selectors in their own slots.  No
 * negate bit is set.
 */
#define UREG( type, nr ) (((type) << UREG_TYPE_SHIFT)         | \
                          ((nr)   << UREG_NR_SHIFT)           | \
                          (X      << UREG_CHANNEL_X_SHIFT)    | \
                          (Y      << UREG_CHANNEL_Y_SHIFT)    | \
                          (Z      << UREG_CHANNEL_Z_SHIFT)    | \
                          (W      << UREG_CHANNEL_W_SHIFT)    | \
                          (ZERO   << UREG_CHANNEL_ZERO_SHIFT) | \
                          (ONE    << UREG_CHANNEL_ONE_SHIFT))

/* Channel slot helpers.  Slots are 4 bits wide and `channel` counts slots
 * downwards from the one at bit 20.
 *
 * GET_CHANNEL_SRC: fetch slot number `channel` of `reg`, returned in the
 *                  bit 20..23 position.
 * CHANNEL_SRC:     move a value sitting in the bit 20..23 position down
 *                  into slot number `channel`.
 *
 * Arguments are fully parenthesized so that expressions such as `a | b`
 * or `i + 1` can be passed safely.
 */
#define GET_CHANNEL_SRC( reg, channel ) (((reg) << ((channel) * 4)) & (0xf << 20))
#define CHANNEL_SRC( src, channel )     ((src) >> ((channel) * 4))

/* Extract the register type / register number field of a ureg. */
#define GET_UREG_TYPE(reg) (((reg) >> UREG_TYPE_SHIFT) & REG_TYPE_MASK)
#define GET_UREG_NR(reg)   (((reg) >> UREG_NR_SHIFT) & REG_NR_MASK)

#define UREG_XYZW_CHANNEL_MASK 0x00ffff00
|
|
/* One neat thing about the UREG representation:
|
*/
|
static inline int
|
swizzle(int reg, uint x, uint y, uint z, uint w)
|
{
|
assert(x <= SRC_ONE);
|
assert(y <= SRC_ONE);
|
assert(z <= SRC_ONE);
|
assert(w <= SRC_ONE);
|
return ((reg & ~UREG_XYZW_CHANNEL_MASK) |
|
CHANNEL_SRC(GET_CHANNEL_SRC(reg, x), 0) |
|
CHANNEL_SRC(GET_CHANNEL_SRC(reg, y), 1) |
|
CHANNEL_SRC(GET_CHANNEL_SRC(reg, z), 2) |
|
CHANNEL_SRC(GET_CHANNEL_SRC(reg, w), 3));
|
}
|
|
|
/* Translate a ureg into the destination / source operand fields of the
 * instruction dwords.  Destinations keep only the type and number bits
 * (UREG_TYPE_NR_MASK); sources keep everything in UREG_MASK.
 *
 * D0_DEST and T0_DEST reuse the A0 destination shift.
 * NOTE(review): presumably the destination field sits at the same bit
 * position in all three dwords -- confirm against i915_reg.h.
 *
 * Naming is historical: the *_SHIFT_LEFT amounts are applied with >> and
 * the *_SHIFT_RIGHT amounts with <<.
 */
#define A0_DEST( reg ) (((reg) & UREG_TYPE_NR_MASK) >> UREG_A0_DEST_SHIFT_LEFT)
#define D0_DEST( reg ) (((reg) & UREG_TYPE_NR_MASK) >> UREG_A0_DEST_SHIFT_LEFT)
#define T0_DEST( reg ) (((reg) & UREG_TYPE_NR_MASK) >> UREG_A0_DEST_SHIFT_LEFT)
#define A0_SRC0( reg ) (((reg) & UREG_MASK) >> UREG_A0_SRC0_SHIFT_LEFT)
#define A1_SRC0( reg ) (((reg) & UREG_MASK) << UREG_A1_SRC0_SHIFT_RIGHT)
#define A1_SRC1( reg ) (((reg) & UREG_MASK) >> UREG_A1_SRC1_SHIFT_LEFT)
#define A2_SRC1( reg ) (((reg) & UREG_MASK) << UREG_A2_SRC1_SHIFT_RIGHT)
#define A2_SRC2( reg ) (((reg) & UREG_MASK) >> UREG_A2_SRC2_SHIFT_LEFT)

/* These are special, and don't have swizzle/negate bits.
 *
 * Only the register number (and, for the address register, the register
 * type) of the ureg is placed into the texture instruction field.
 */
#define T0_SAMPLER( reg )     (GET_UREG_NR(reg) << T0_SAMPLER_NR_SHIFT)
#define T1_ADDRESS_REG( reg ) ((GET_UREG_NR(reg) << T1_ADDRESS_REG_NR_SHIFT) | \
                               (GET_UREG_TYPE(reg) << T1_ADDRESS_REG_TYPE_SHIFT))

/* Macros for translating UREG's into the various register fields used
 * by the I915 programmable unit.
 *
 * Each value is the distance between a ureg field and the corresponding
 * field in an instruction dword.  The *_SHIFT_LEFT distances are measured
 * from the type fields, the *_SHIFT_RIGHT distances from the W channel
 * fields.
 */
#define UREG_A0_DEST_SHIFT_LEFT  (UREG_TYPE_SHIFT - A0_DEST_TYPE_SHIFT)
#define UREG_A0_SRC0_SHIFT_LEFT  (UREG_TYPE_SHIFT - A0_SRC0_TYPE_SHIFT)
#define UREG_A1_SRC0_SHIFT_RIGHT (A1_SRC0_CHANNEL_W_SHIFT - UREG_CHANNEL_W_SHIFT)
#define UREG_A1_SRC1_SHIFT_LEFT  (UREG_TYPE_SHIFT - A1_SRC1_TYPE_SHIFT)
#define UREG_A2_SRC1_SHIFT_RIGHT (A2_SRC1_CHANNEL_W_SHIFT - UREG_CHANNEL_W_SHIFT)
#define UREG_A2_SRC2_SHIFT_LEFT  (UREG_TYPE_SHIFT - A2_SRC2_TYPE_SHIFT)

/* UREG_MASK keeps bits 8..31 of a ureg and drops the low byte.
 * UREG_TYPE_NR_MASK keeps only the register type and register number
 * fields.
 */
#define UREG_MASK         0xffffff00
#define UREG_TYPE_NR_MASK ((REG_TYPE_MASK << UREG_TYPE_SHIFT) | \
                           (REG_NR_MASK << UREG_NR_SHIFT))

/***********************************************************************
 * Public interface for the compiler
 */

/* Translate the fragment shader `fs` for the context `i915`.
 * NOTE(review): results are presumably stored in `fs`, since nothing is
 * returned -- confirm in the implementation.
 */
extern void
i915_translate_fragment_program(struct i915_context *i915,
                                struct i915_fragment_shader *fs);

/* Temporary register management on the compile state `p`.
 * NOTE(review): presumably these work on p->temp_flag / p->utemp_flag and
 * the getters return a ureg -- confirm in the implementation.
 */
extern uint i915_get_temp(struct i915_fp_compile *p);
extern uint i915_get_utemp(struct i915_fp_compile *p);
extern void i915_release_utemps(struct i915_fp_compile *p);

extern uint i915_emit_texld(struct i915_fp_compile *p,
|
uint dest,
|
uint destmask,
|
uint sampler,
|
uint coord,
|
uint op,
|
uint num_coord);
|
|
extern uint i915_emit_arith(struct i915_fp_compile *p,
|
uint op,
|
uint dest,
|
uint mask,
|
uint saturate,
|
uint src0, uint src1, uint src2);
|
|
extern uint i915_emit_decl(struct i915_fp_compile *p,
|
uint type, uint nr, uint d0_flags);
|
|
|
/* Constant emitters taking one, two or four float values (the 4fv variant
 * reads them through a pointer).
 * NOTE(review): presumably each returns a ureg referring to the constant
 * -- confirm in the implementation.
 */
extern uint i915_emit_const1f(struct i915_fp_compile *p, float c0);

extern uint i915_emit_const2f(struct i915_fp_compile *p,
                              float c0, float c1);

extern uint i915_emit_const4fv(struct i915_fp_compile *p,
                               const float *c);

extern uint i915_emit_const4f(struct i915_fp_compile *p,
                              float c0, float c1,
                              float c2, float c3);

/*======================================================================
 * i915_fpc_translate.c
 */

/* Report a compile error on `p`; the `error` member of
 * struct i915_fp_compile is documented as being set when this is called.
 * NOTE(review): `msg` followed by `...` is presumably a printf-style
 * format string with its arguments -- confirm in the implementation.
 */
extern void
i915_program_error(struct i915_fp_compile *p, const char *msg, ...);

/*======================================================================
 * i915_fpc_optimize.c
 */

/* Source operand as used by the i915 optimizer.  The swizzle fields are
 * 3 bits wide, which leaves room for the i915-only TGSI_SWIZZLE_ZERO and
 * TGSI_SWIZZLE_ONE selectors.
 */
struct i915_src_register
{
   unsigned File        : 4;  /* TGSI_FILE_ */
   unsigned Indirect    : 1;  /* BOOL */
   unsigned Dimension   : 1;  /* BOOL */
   int      Index       : 16; /* SINT */
   unsigned SwizzleX    : 3;  /* TGSI_SWIZZLE_ */
   unsigned SwizzleY    : 3;  /* TGSI_SWIZZLE_ */
   unsigned SwizzleZ    : 3;  /* TGSI_SWIZZLE_ */
   unsigned SwizzleW    : 3;  /* TGSI_SWIZZLE_ */
   unsigned Absolute    : 1;  /* BOOL */
   unsigned Negate      : 1;  /* BOOL */
};

/* Additional swizzle supported in i915: constant 0 and constant 1
 * selectors.  Both values fit the 3-bit SwizzleX..SwizzleW fields of
 * struct i915_src_register.
 */
#define TGSI_SWIZZLE_ZERO 4
#define TGSI_SWIZZLE_ONE 5

/* Destination operand as used by the i915 optimizer.  The bit-fields add
 * up to 32 bits, the last 6 of which are explicit padding.
 */
struct i915_dst_register
{
   unsigned File        : 4;  /* TGSI_FILE_ */
   unsigned WriteMask   : 4;  /* TGSI_WRITEMASK_ */
   unsigned Indirect    : 1;  /* BOOL */
   unsigned Dimension   : 1;  /* BOOL */
   int      Index       : 16; /* SINT */
   unsigned Padding     : 6;
};

struct i915_full_dst_register
|
{
|
struct i915_dst_register Register;
|
/*
|
struct tgsi_ind_register Indirect;
|
struct tgsi_dimension Dimension;
|
struct tgsi_ind_register DimIndirect;
|
*/
|
};
|
|
struct i915_full_src_register
|
{
|
struct i915_src_register Register;
|
/*
|
struct tgsi_ind_register Indirect;
|
struct tgsi_dimension Dimension;
|
struct tgsi_ind_register DimIndirect;
|
*/
|
};
|
|
struct i915_full_instruction
|
{
|
struct tgsi_instruction Instruction;
|
/*
|
struct tgsi_instruction_label Label;
|
*/
|
struct tgsi_instruction_texture Texture;
|
struct i915_full_dst_register Dst[1];
|
struct i915_full_src_register Src[3];
|
};
|
|
|
union i915_full_token
|
{
|
struct tgsi_token Token;
|
struct tgsi_full_declaration FullDeclaration;
|
struct tgsi_full_immediate FullImmediate;
|
struct i915_full_instruction FullInstruction;
|
struct tgsi_full_property FullProperty;
|
};
|
|
/* Array of tokens together with its element count. */
struct i915_token_list
{
   union i915_full_token *Tokens;
   unsigned NumTokens;
};

extern struct i915_token_list* i915_optimize(const struct tgsi_token *tokens);
|
|
extern void i915_optimize_free(struct i915_token_list *tokens);
|
|
extern uint i915_num_coords(uint tex);
|
|
#endif
|