/**************************************************************************
 *
 * Copyright 2003 VMware, Inc.
 * All Rights Reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sub license, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 *
 **************************************************************************/

#ifndef I915_FPC_H
#define I915_FPC_H

#include "i915_context.h"
#include "i915_reg.h"

#include "pipe/p_shader_tokens.h"

#include "tgsi/tgsi_parse.h"

struct nir_shader;

/** Capacity, in 32-bit words, of each of the declarations[] and program[]
 * buffers in struct i915_fp_compile.
 */
#define I915_PROGRAM_SIZE 192

/**
 * Program translation state
 *
 * Working state used while compiling one fragment shader: constant and
 * immediate bookkeeping, the output buffers for declarations and
 * instructions together with their write cursors, register-usage flags,
 * and error/statistics fields.
 */
struct i915_fp_compile {
   struct i915_fragment_shader *shader; /* the shader we're compiling */

   /* One flag per constant slot.
    * NOTE(review): presumably set when the slot is claimed -- confirm in
    * the compiler sources.
    */
   bool used_constants[I915_MAX_CONSTANT];

   /* NOTE(review): presumably the number of valid entries in
    * immediates_map[] / immediates[] -- confirm.
    */
   uint32_t num_immediates;
   /** maps TGSI immediate index to constant slot */
   uint32_t immediates_map[I915_MAX_CONSTANT];
   /* Four float components per immediate. */
   float immediates[I915_MAX_CONSTANT][4];

   /* NOTE(review): meaning not visible in this header -- see the
    * translation code.
    */
   bool first_instruction;

   /* Output buffers, I915_PROGRAM_SIZE 32-bit words each. */
   uint32_t declarations[I915_PROGRAM_SIZE];
   uint32_t program[I915_PROGRAM_SIZE];

   uint32_t *csr; /**< Cursor, points into program. */

   uint32_t *decl; /**< Cursor, points into declarations. */

   uint32_t decl_s; /**< flags for which s regs need to be decl'd */
   uint32_t decl_t; /**< flags for which t regs need to be decl'd */

   uint32_t temp_flag;  /**< Tracks temporary regs which are in use */
   uint32_t utemp_flag; /**< Tracks TYPE_U temporary regs which are in use */

   /* One entry per temporary register, plus running counters.
    * NOTE(review): presumably used to count texture indirection phases and
    * emitted instructions per category -- confirm against the emit code.
    */
   uint32_t register_phases[I915_MAX_TEMPORARY];
   uint32_t nr_tex_indirect;
   uint32_t nr_tex_insn;
   uint32_t nr_alu_insn;
   uint32_t nr_decl_insn;

   /* NOTE(review): presumably gates whether i915_program_error() prints its
    * message -- confirm.
    */
   bool log_program_errors;
   bool error; /**< Set if i915_program_error() is called */
   /* NOTE(review): statistics fields; where they are written is not
    * visible in this header.
    */
   uint32_t NumNativeInstructions;
   uint32_t NumNativeAluInstructions;
   uint32_t NumNativeTexInstructions;
   uint32_t NumNativeTexIndirections;
};

/* Bit positions of the fields of a "ureg", the 32-bit register reference
 * used throughout the compiler.  Reading the shifts below from the top:
 *
 *    bit 29 and up   register type
 *    bit 24 and up   register number
 *    bit 23 / 20     X negate / X channel select
 *    bit 19 / 16     Y negate / Y channel select
 *    bit 15 / 12     Z negate / Z channel select
 *    bit 11 /  8     W negate / W channel select
 *    bit  4          slot holding the constant ZERO selector
 *    bit  0          slot holding the constant ONE selector
 *
 * Having zero and one in here makes the definition of swizzle a lot
 * easier.
 *
 * NOTE(review): for X/Y/Z/W the negate bit sits three bits above the channel
 * shift, but the ZERO/ONE "*_NEGATE_MBZ" values (5 and 1) sit only one bit
 * above theirs.  MBZ presumably means "must be zero"; confirm whether these
 * two constants are used anywhere and whether 7 and 3 were intended.
 */
#define UREG_TYPE_SHIFT              29
#define UREG_NR_SHIFT                24
#define UREG_CHANNEL_X_NEGATE_SHIFT  23
#define UREG_CHANNEL_X_SHIFT         20
#define UREG_CHANNEL_Y_NEGATE_SHIFT  19
#define UREG_CHANNEL_Y_SHIFT         16
#define UREG_CHANNEL_Z_NEGATE_SHIFT  15
#define UREG_CHANNEL_Z_SHIFT         12
#define UREG_CHANNEL_W_NEGATE_SHIFT  11
#define UREG_CHANNEL_W_SHIFT         8
#define UREG_CHANNEL_ZERO_NEGATE_MBZ 5
#define UREG_CHANNEL_ZERO_SHIFT      4
#define UREG_CHANNEL_ONE_NEGATE_MBZ  1
#define UREG_CHANNEL_ONE_SHIFT       0

#define UREG_BAD 0xffffffff /* not a valid ureg */

/* Short aliases for the SRC_* channel selectors, used as swizzle arguments.
 * NOTE(review): single-letter macros in a header affect every file that
 * includes it; avoid identifiers named X, Y, Z or W in such files.
 */
#define X    SRC_X
#define Y    SRC_Y
#define Z    SRC_Z
#define W    SRC_W
#define ZERO SRC_ZERO
#define ONE  SRC_ONE

/* Construct a ureg of the given register type and number with the identity
 * swizzle: X, Y, Z and W select themselves, the two extra slots hold ZERO
 * and ONE, and no negate bit is set.
 */
#define UREG(type, nr)                                                         \
   (((type) << UREG_TYPE_SHIFT) | ((nr) << UREG_NR_SHIFT) |                    \
    (X << UREG_CHANNEL_X_SHIFT) | (Y << UREG_CHANNEL_Y_SHIFT) |                \
    (Z << UREG_CHANNEL_Z_SHIFT) | (W << UREG_CHANNEL_W_SHIFT) |                \
    (ZERO << UREG_CHANNEL_ZERO_SHIFT) | (ONE << UREG_CHANNEL_ONE_SHIFT))

/* Fetch one 4-bit channel field of `reg` and return it in the X position
 * (bits 20..23), with every other bit cleared.  `channel` counts 4-bit
 * slots downwards from X: 0 is the X slot, 1 the Y slot, 2 the Z slot,
 * 3 the W slot, 4 the ZERO slot and 5 the ONE slot.
 *
 * Both arguments are parenthesised so that expressions such as `i + 1` or
 * `a | b` can be passed safely.
 */
#define GET_CHANNEL_SRC(reg, channel)                                          \
   (((reg) << ((channel) * 4)) & (0xf << 20))

/* Move a field that sits in the X position (as produced by
 * GET_CHANNEL_SRC) down into destination slot `channel`, using the same
 * slot numbering.
 */
#define CHANNEL_SRC(src, channel) ((src) >> ((channel) * 4))

/* Extract the register type / register number of a ureg. */
#define GET_UREG_TYPE(reg) (((reg) >> UREG_TYPE_SHIFT) & REG_TYPE_MASK)
#define GET_UREG_NR(reg)   (((reg) >> UREG_NR_SHIFT) & REG_NR_MASK)

/* Bits 8..23: the X, Y, Z and W channel fields, including their negate
 * bits.
 */
#define UREG_XYZW_CHANNEL_MASK 0x00ffff00

/* One neat thing about the UREG representation: every channel selector,
 * including the constant ZERO and ONE slots, lives in a 4-bit field at a
 * regular position, so swizzling is just copying fields around.
 *
 * Returns `reg` with its X, Y, Z and W fields replaced by the fields of
 * `reg` chosen by `x`, `y`, `z` and `w` respectively.  Bits outside
 * UREG_XYZW_CHANNEL_MASK are passed through unchanged.  Each selector must
 * be <= SRC_ONE (asserted).
 *
 * The bit manipulation is done on an unsigned copy of `reg`.  With the type
 * field starting at bit 29, a type value of 4 or more makes the ureg
 * negative as an int, and left-shifting a negative (or overflowing) signed
 * value is undefined behaviour in C.  The final conversion back to int is
 * merely implementation-defined and keeps the bit pattern on the compilers
 * this code is built with.
 */
static inline int
swizzle(int reg, uint32_t x, uint32_t y, uint32_t z, uint32_t w)
{
   const uint32_t ureg = (uint32_t)reg;

   assert(x <= SRC_ONE);
   assert(y <= SRC_ONE);
   assert(z <= SRC_ONE);
   assert(w <= SRC_ONE);

   return (int)((ureg & ~(uint32_t)UREG_XYZW_CHANNEL_MASK) |
                CHANNEL_SRC(GET_CHANNEL_SRC(ureg, x), 0) |
                CHANNEL_SRC(GET_CHANNEL_SRC(ureg, y), 1) |
                CHANNEL_SRC(GET_CHANNEL_SRC(ureg, z), 2) |
                CHANNEL_SRC(GET_CHANNEL_SRC(ureg, w), 3));
}

/* Convert a ureg into the bit position of a particular operand field of an
 * instruction word.  The prefix names the target word and the suffix the
 * operand.  The *_DEST forms keep only the type and number fields; the
 * *_SRC forms keep type, number and the XYZW channel fields (UREG_MASK).
 *
 * NOTE(review): D0_DEST and T0_DEST reuse UREG_A0_DEST_SHIFT_LEFT, which is
 * only right if the destination type field sits at the same bit in all
 * three instruction formats -- confirm against i915_reg.h.
 */
#define A0_DEST(reg) (((reg)&UREG_TYPE_NR_MASK) >> UREG_A0_DEST_SHIFT_LEFT)
#define D0_DEST(reg) (((reg)&UREG_TYPE_NR_MASK) >> UREG_A0_DEST_SHIFT_LEFT)
#define T0_DEST(reg) (((reg)&UREG_TYPE_NR_MASK) >> UREG_A0_DEST_SHIFT_LEFT)
#define A0_SRC0(reg) (((reg)&UREG_MASK) >> UREG_A0_SRC0_SHIFT_LEFT)
#define A1_SRC0(reg) (((reg)&UREG_MASK) << UREG_A1_SRC0_SHIFT_RIGHT)
#define A1_SRC1(reg) (((reg)&UREG_MASK) >> UREG_A1_SRC1_SHIFT_LEFT)
#define A2_SRC1(reg) (((reg)&UREG_MASK) << UREG_A2_SRC1_SHIFT_RIGHT)
#define A2_SRC2(reg) (((reg)&UREG_MASK) >> UREG_A2_SRC2_SHIFT_LEFT)

/* These are special, and don't have swizzle/negate bits.
 * Only the register number (and, for T1_ADDRESS_REG, the type) is encoded.
 */
#define T0_SAMPLER(reg) (GET_UREG_NR(reg) << T0_SAMPLER_NR_SHIFT)
#define T1_ADDRESS_REG(reg)                                                    \
   ((GET_UREG_NR(reg) << T1_ADDRESS_REG_NR_SHIFT) |                            \
    (GET_UREG_TYPE(reg) << T1_ADDRESS_REG_TYPE_SHIFT))

/* Macros for translating UREG's into the various register fields used
 * by the I915 programmable unit.
 *
 * Each value is the distance between where a field sits in a ureg and where
 * it sits in the target instruction word.
 *
 * NOTE(review): the *_SHIFT_LEFT distances are applied with >> and the
 * *_SHIFT_RIGHT distances with << in the macros above, so the LEFT/RIGHT
 * suffix reads opposite to the operator used.
 */
#define UREG_A0_DEST_SHIFT_LEFT (UREG_TYPE_SHIFT - A0_DEST_TYPE_SHIFT)
#define UREG_A0_SRC0_SHIFT_LEFT (UREG_TYPE_SHIFT - A0_SRC0_TYPE_SHIFT)
#define UREG_A1_SRC0_SHIFT_RIGHT                                               \
   (A1_SRC0_CHANNEL_W_SHIFT - UREG_CHANNEL_W_SHIFT)
#define UREG_A1_SRC1_SHIFT_LEFT (UREG_TYPE_SHIFT - A1_SRC1_TYPE_SHIFT)
#define UREG_A2_SRC1_SHIFT_RIGHT                                               \
   (A2_SRC1_CHANNEL_W_SHIFT - UREG_CHANNEL_W_SHIFT)
#define UREG_A2_SRC2_SHIFT_LEFT (UREG_TYPE_SHIFT - A2_SRC2_TYPE_SHIFT)

/* Bits 8..31 of a ureg: everything except the ZERO/ONE slots in the low
 * byte.
 */
#define UREG_MASK 0xffffff00
/* Only the register type and register number fields of a ureg. */
#define UREG_TYPE_NR_MASK                                                      \
   ((REG_TYPE_MASK << UREG_TYPE_SHIFT) | (REG_NR_MASK << UREG_NR_SHIFT))

/***********************************************************************
 * Public interface for the compiler
 *
 * Function declarations have external linkage by default, so no storage
 * class specifier is written.
 */

/* Translate the fragment shader `fs` for the context `i915`. */
void i915_translate_fragment_program(struct i915_context *i915,
                                     struct i915_fragment_shader *fs);

/* Temporary-register helpers operating on the compile state `p`.
 * NOTE(review): the uint32_t results are presumably uregs -- confirm.
 */
uint32_t i915_get_temp(struct i915_fp_compile *p);
uint32_t i915_get_utemp(struct i915_fp_compile *p);
void i915_release_utemps(struct i915_fp_compile *p);

/* Instruction emitters.  Register operands are passed as uint32_t values. */
uint32_t i915_emit_texld(struct i915_fp_compile *p, uint32_t dest,
                         uint32_t destmask, uint32_t sampler, uint32_t coord,
                         uint32_t op, uint32_t num_coord);

uint32_t i915_emit_arith(struct i915_fp_compile *p, uint32_t op, uint32_t dest,
                         uint32_t mask, uint32_t saturate, uint32_t src0,
                         uint32_t src1, uint32_t src2);

uint32_t i915_emit_decl(struct i915_fp_compile *p, uint32_t type, uint32_t nr,
                        uint32_t d0_flags);

/* Constant emitters taking one, two or four float components; the 4fv
 * variant reads its components through the pointer `c`.
 */
uint32_t i915_emit_const1f(struct i915_fp_compile *p, float c0);

uint32_t i915_emit_const2f(struct i915_fp_compile *p, float c0, float c1);

uint32_t i915_emit_const4fv(struct i915_fp_compile *p, const float *c);

uint32_t i915_emit_const4f(struct i915_fp_compile *p, float c0, float c1,
                           float c2, float c3);

/*======================================================================
 * i915_fpc_translate.c
 */

/* Report a compile error against `p`.  Takes a message followed by variadic
 * arguments (presumably printf-style -- confirm).  The `error` member of
 * struct i915_fp_compile is documented as being set whenever this is called.
 */
void i915_program_error(struct i915_fp_compile *p, const char *msg, ...);

/*======================================================================
 * i915_fpc_optimize.c
 */

/* Source operand as used by the i915 optimizer.
 *
 * The swizzle fields are three bits wide so that they can hold the two extra
 * selectors TGSI_SWIZZLE_ZERO and TGSI_SWIZZLE_ONE defined below.  The
 * declared widths add up to 36 bits, so the struct does not fit in a single
 * 32-bit word.
 *
 * Index is declared `signed int`: whether a plain `int` bit-field is signed
 * is implementation-defined in C, and this field must be able to hold
 * negative values (SINT).
 */
struct i915_src_register {
   unsigned File : 4;      /* TGSI_FILE_ */
   unsigned Indirect : 1;  /* BOOL */
   unsigned Dimension : 1; /* BOOL */
   signed int Index : 16;  /* SINT */
   unsigned SwizzleX : 3;  /* TGSI_SWIZZLE_ */
   unsigned SwizzleY : 3;  /* TGSI_SWIZZLE_ */
   unsigned SwizzleZ : 3;  /* TGSI_SWIZZLE_ */
   unsigned SwizzleW : 3;  /* TGSI_SWIZZLE_ */
   unsigned Absolute : 1;  /* BOOL */
   unsigned Negate : 1;    /* BOOL */
};

/* Additional swizzle supported in i915 */
#define TGSI_SWIZZLE_ZERO 4
#define TGSI_SWIZZLE_ONE  5

/* Destination operand as used by the i915 optimizer.  The declared field
 * widths add up to 32 bits, with Padding filling the remainder.
 *
 * Index is declared `signed int`: whether a plain `int` bit-field is signed
 * is implementation-defined in C, and this field must be able to hold
 * negative values (SINT).
 */
struct i915_dst_register {
   unsigned File : 4;      /* TGSI_FILE_ */
   unsigned WriteMask : 4; /* TGSI_WRITEMASK_ */
   unsigned Indirect : 1;  /* BOOL */
   unsigned Dimension : 1; /* BOOL */
   signed int Index : 16;  /* SINT */
   unsigned Padding : 6;
};

/* Wrapper holding just the packed destination register.  The indirect and
 * dimension members listed in the comment below are commented out and are
 * therefore not part of this struct.
 */
struct i915_full_dst_register {
   struct i915_dst_register Register;
   /*
      struct tgsi_ind_register               Indirect;
      struct tgsi_dimension                  Dimension;
      struct tgsi_ind_register               DimIndirect;
   */
};

/* Wrapper holding just the packed source register.  The indirect and
 * dimension members listed in the comment below are commented out and are
 * therefore not part of this struct.
 */
struct i915_full_src_register {
   struct i915_src_register Register;
   /*
      struct tgsi_ind_register         Indirect;
      struct tgsi_dimension            Dimension;
      struct tgsi_ind_register         DimIndirect;
   */
};

/* One instruction in the optimizer's representation: the TGSI instruction
 * and texture headers plus exactly one destination and up to three source
 * operands in the i915 register formats.  The label member is commented out
 * and is not part of this struct.
 */
struct i915_full_instruction {
   struct tgsi_instruction Instruction;
   /*
      struct tgsi_instruction_label       Label;
   */
   struct tgsi_instruction_texture Texture;
   struct i915_full_dst_register Dst[1];
   struct i915_full_src_register Src[3];
};

/* A single token of the optimizer's token list.  Declarations, immediates
 * and properties use the TGSI "full" structs; instructions use the i915
 * variant.
 * NOTE(review): Token presumably carries the tag that selects which member
 * is valid -- confirm against struct tgsi_token.
 */
union i915_full_token {
   struct tgsi_token Token;
   struct tgsi_full_declaration FullDeclaration;
   struct tgsi_full_immediate FullImmediate;
   struct i915_full_instruction FullInstruction;
   struct tgsi_full_property FullProperty;
};

/* A token array together with its length.
 * NOTE(review): NumTokens is presumably the number of valid entries in
 * Tokens -- confirm in i915_fpc_optimize.c.
 */
struct i915_token_list {
   union i915_full_token *Tokens;
   unsigned NumTokens;
};

/* Build an i915 token list from a TGSI token stream, and release one.
 * NOTE(review): a list returned by i915_optimize() is presumably meant to be
 * handed back to i915_optimize_free() -- confirm ownership in
 * i915_fpc_optimize.c.
 */
struct i915_token_list *i915_optimize(const struct tgsi_token *tokens);

void i915_optimize_free(struct i915_token_list *tokens);

/* Takes a uint32_t `tex` value and returns a uint32_t count. */
uint32_t i915_num_coords(uint32_t tex);

/* NIR pass entry point operating on the shader `s`.
 * NOTE(review): the bool result presumably reports whether the shader was
 * changed -- confirm.
 */
bool i915_nir_lower_sincos(struct nir_shader *s);

#endif
