/*
|
* Copyright 2012 Advanced Micro Devices, Inc.
|
*
|
* Permission is hereby granted, free of charge, to any person obtaining a
|
* copy of this software and associated documentation files (the "Software"),
|
* to deal in the Software without restriction, including without limitation
|
* on the rights to use, copy, modify, merge, publish, distribute, sub
|
* license, and/or sell copies of the Software, and to permit persons to whom
|
* the Software is furnished to do so, subject to the following conditions:
|
*
|
* The above copyright notice and this permission notice (including the next
|
* paragraph) shall be included in all copies or substantial portions of the
|
* Software.
|
*
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
* FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
|
* THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
|
* DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
|
* OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
|
* USE OR OTHER DEALINGS IN THE SOFTWARE.
|
*
|
* Author: Tom Stellard <thomas.stellard@amd.com>
|
*/
|
|
#include "radeon_compiler.h"
|
#include "radeon_compiler_util.h"
|
#include "radeon_dataflow.h"
|
#include "radeon_program.h"
|
#include "radeon_program_constants.h"
|
#include "util/u_bitcast.h"
|
#include <stdio.h>
|
|
#define VERBOSE 0
|
|
#define DBG(...) do { if (VERBOSE) fprintf(stderr, __VA_ARGS__); } while(0)
|
|
/* IEEE-754:
|
* 22:0 mantissa
|
* 30:23 exponent
|
* 31 sign
|
*
|
* R300:
|
* 0:2 mantissa
|
* 3:6 exponent (bias 7)
|
*/
|
static int ieee_754_to_r300_float(float f, unsigned char *r300_float_out)
|
{
|
unsigned float_bits = u_bitcast_f2u(f);
|
/* XXX: Handle big-endian */
|
unsigned mantissa = float_bits & 0x007fffff;
|
unsigned biased_exponent = (float_bits & 0x7f800000) >> 23;
|
unsigned negate = !!(float_bits & 0x80000000);
|
int exponent = biased_exponent - 127;
|
unsigned mantissa_mask = 0xff8fffff;
|
unsigned r300_exponent, r300_mantissa;
|
|
DBG("Converting %f (0x%x) to 7-bit:\n", f, float_bits);
|
DBG("Raw exponent = %d\n", exponent);
|
|
if (exponent < -7 || exponent > 8) {
|
DBG("Failed exponent out of range\n\n");
|
return 0;
|
}
|
|
if (mantissa & mantissa_mask) {
|
DBG("Failed mantisa has too many bits:\n"
|
"manitssa=0x%x mantissa_mask=0x%x, and=0x%x\n\n",
|
mantissa, mantissa_mask,
|
mantissa & mantissa_mask);
|
return 0;
|
}
|
|
r300_exponent = exponent + 7;
|
r300_mantissa = (mantissa & ~mantissa_mask) >> 20;
|
*r300_float_out = r300_mantissa | (r300_exponent << 3);
|
|
DBG("Success! r300_float = 0x%x\n\n", *r300_float_out);
|
|
if (negate)
|
return -1;
|
else
|
return 1;
|
}
|
|
void rc_inline_literals(struct radeon_compiler *c, void *user)
|
{
|
struct rc_instruction * inst;
|
|
for(inst = c->Program.Instructions.Next;
|
inst != &c->Program.Instructions;
|
inst = inst->Next) {
|
const struct rc_opcode_info * info =
|
rc_get_opcode_info(inst->U.I.Opcode);
|
|
unsigned src_idx;
|
struct rc_constant * constant;
|
float float_value;
|
unsigned char r300_float = 0;
|
int ret;
|
|
/* XXX: Handle presub */
|
|
/* We aren't using rc_for_all_reads_src here, because presub
|
* sources need to be handled differently. */
|
for (src_idx = 0; src_idx < info->NumSrcRegs; src_idx++) {
|
unsigned new_swizzle;
|
unsigned use_literal = 0;
|
unsigned negate_mask = 0;
|
unsigned swz, chan;
|
struct rc_src_register * src_reg =
|
&inst->U.I.SrcReg[src_idx];
|
swz = RC_SWIZZLE_UNUSED;
|
if (src_reg->File != RC_FILE_CONSTANT) {
|
continue;
|
}
|
constant =
|
&c->Program.Constants.Constants[src_reg->Index];
|
if (constant->Type != RC_CONSTANT_IMMEDIATE) {
|
continue;
|
}
|
new_swizzle = rc_init_swizzle(RC_SWIZZLE_UNUSED, 0);
|
for (chan = 0; chan < 4; chan++) {
|
unsigned char r300_float_tmp;
|
swz = GET_SWZ(src_reg->Swizzle, chan);
|
if (swz == RC_SWIZZLE_UNUSED) {
|
continue;
|
}
|
float_value = constant->u.Immediate[swz];
|
ret = ieee_754_to_r300_float(float_value,
|
&r300_float_tmp);
|
if (!ret || (use_literal &&
|
r300_float != r300_float_tmp)) {
|
use_literal = 0;
|
break;
|
}
|
|
if (ret == -1 && src_reg->Abs) {
|
use_literal = 0;
|
break;
|
}
|
|
if (!use_literal) {
|
r300_float = r300_float_tmp;
|
use_literal = 1;
|
}
|
|
/* Use RC_SWIZZLE_W for the inline constant, so
|
* it will become one of the alpha sources. */
|
SET_SWZ(new_swizzle, chan, RC_SWIZZLE_W);
|
if (ret == -1) {
|
negate_mask |= (1 << chan);
|
}
|
}
|
|
if (!use_literal) {
|
continue;
|
}
|
src_reg->File = RC_FILE_INLINE;
|
src_reg->Index = r300_float;
|
src_reg->Swizzle = new_swizzle;
|
src_reg->Negate = src_reg->Negate ^ negate_mask;
|
}
|
}
|
}
|