Subversion Repositories Kolibri OS

Rev

Go to most recent revision | Blame | Last modification | View Log | RSS feed

  1. /*
  2.  * Copyright (C) 2008 Nicolai Haehnle.
  3.  *
  4.  * All Rights Reserved.
  5.  *
  6.  * Permission is hereby granted, free of charge, to any person obtaining
  7.  * a copy of this software and associated documentation files (the
  8.  * "Software"), to deal in the Software without restriction, including
  9.  * without limitation the rights to use, copy, modify, merge, publish,
  10.  * distribute, sublicense, and/or sell copies of the Software, and to
  11.  * permit persons to whom the Software is furnished to do so, subject to
  12.  * the following conditions:
  13.  *
  14.  * The above copyright notice and this permission notice (including the
  15.  * next paragraph) shall be included in all copies or substantial
  16.  * portions of the Software.
  17.  *
  18.  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  19.  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  20.  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
  21.  * IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
  22.  * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
  23.  * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
  24.  * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
  25.  *
  26.  */
  27.  
  28. /**
  29.  * @file
  30.  * Utilities to deal with the somewhat odd restriction on R300 fragment
  31.  * program swizzles.
  32.  */
  33.  
  34. #include "r300_fragprog_swizzle.h"
  35.  
  36. #include <stdio.h>
  37.  
  38. #include "../r300_reg.h"
  39. #include "radeon_compiler.h"
  40.  
  41. #define MAKE_SWZ3(x, y, z) (RC_MAKE_SWIZZLE(RC_SWIZZLE_##x, RC_SWIZZLE_##y, RC_SWIZZLE_##z, RC_SWIZZLE_ZERO))
  42.  
  43. struct swizzle_data {
  44.         unsigned int hash; /**< swizzle value this matches */
  45.         unsigned int base; /**< base value for hw swizzle */
  46.         unsigned int stride; /**< difference in base between arg0/1/2 */
  47.         unsigned int srcp_stride; /**< difference in base between arg0/scrp */
  48. };
  49.  
  50. static const struct swizzle_data native_swizzles[] = {
  51.         {MAKE_SWZ3(X, Y, Z), R300_ALU_ARGC_SRC0C_XYZ, 4, 15},
  52.         {MAKE_SWZ3(X, X, X), R300_ALU_ARGC_SRC0C_XXX, 4, 15},
  53.         {MAKE_SWZ3(Y, Y, Y), R300_ALU_ARGC_SRC0C_YYY, 4, 15},
  54.         {MAKE_SWZ3(Z, Z, Z), R300_ALU_ARGC_SRC0C_ZZZ, 4, 15},
  55.         {MAKE_SWZ3(W, W, W), R300_ALU_ARGC_SRC0A, 1, 7},
  56.         {MAKE_SWZ3(Y, Z, X), R300_ALU_ARGC_SRC0C_YZX, 1, 0},
  57.         {MAKE_SWZ3(Z, X, Y), R300_ALU_ARGC_SRC0C_ZXY, 1, 0},
  58.         {MAKE_SWZ3(W, Z, Y), R300_ALU_ARGC_SRC0CA_WZY, 1, 0},
  59.         {MAKE_SWZ3(ONE, ONE, ONE), R300_ALU_ARGC_ONE, 0, 0},
  60.         {MAKE_SWZ3(ZERO, ZERO, ZERO), R300_ALU_ARGC_ZERO, 0, 0},
  61.         {MAKE_SWZ3(HALF, HALF, HALF), R300_ALU_ARGC_HALF, 0, 0}
  62. };
  63.  
  64. static const int num_native_swizzles = sizeof(native_swizzles)/sizeof(native_swizzles[0]);
  65.  
  66. /**
  67.  * Find a native RGB swizzle that matches the given swizzle.
  68.  * Returns 0 if none found.
  69.  */
  70. static const struct swizzle_data* lookup_native_swizzle(unsigned int swizzle)
  71. {
  72.         int i, comp;
  73.  
  74.         for(i = 0; i < num_native_swizzles; ++i) {
  75.                 const struct swizzle_data* sd = &native_swizzles[i];
  76.                 for(comp = 0; comp < 3; ++comp) {
  77.                         unsigned int swz = GET_SWZ(swizzle, comp);
  78.                         if (swz == RC_SWIZZLE_UNUSED)
  79.                                 continue;
  80.                         if (swz != GET_SWZ(sd->hash, comp))
  81.                                 break;
  82.                 }
  83.                 if (comp == 3)
  84.                         return sd;
  85.         }
  86.  
  87.         return 0;
  88. }
  89.  
  90. /**
  91.  * Determines if the given swizzle is valid for r300/r400.  In most situations
  92.  * it is better to use r300_swizzle_is_native() which can be accesed via
  93.  * struct radeon_compiler *c; c->SwizzleCaps->IsNative().
  94.  */
  95. int r300_swizzle_is_native_basic(unsigned int swizzle)
  96. {
  97.         if(lookup_native_swizzle(swizzle))
  98.                 return 1;
  99.         else
  100.                 return 0;
  101. }
  102.  
  103. /**
  104.  * Check whether the given instruction supports the swizzle and negate
  105.  * combinations in the given source register.
  106.  */
  107. static int r300_swizzle_is_native(rc_opcode opcode, struct rc_src_register reg)
  108. {
  109.         const struct swizzle_data* sd;
  110.         unsigned int relevant;
  111.         int j;
  112.  
  113.         if (opcode == RC_OPCODE_KIL ||
  114.             opcode == RC_OPCODE_TEX ||
  115.             opcode == RC_OPCODE_TXB ||
  116.             opcode == RC_OPCODE_TXP) {
  117.                 if (reg.Abs || reg.Negate)
  118.                         return 0;
  119.  
  120.                 for(j = 0; j < 4; ++j) {
  121.                         unsigned int swz = GET_SWZ(reg.Swizzle, j);
  122.                         if (swz == RC_SWIZZLE_UNUSED)
  123.                                 continue;
  124.                         if (swz != j)
  125.                                 return 0;
  126.                 }
  127.  
  128.                 return 1;
  129.         }
  130.  
  131.         relevant = 0;
  132.  
  133.         for(j = 0; j < 3; ++j)
  134.                 if (GET_SWZ(reg.Swizzle, j) != RC_SWIZZLE_UNUSED)
  135.                         relevant |= 1 << j;
  136.  
  137.         if ((reg.Negate & relevant) && ((reg.Negate & relevant) != relevant))
  138.                 return 0;
  139.  
  140.         sd = lookup_native_swizzle(reg.Swizzle);
  141.         if (!sd || (reg.File == RC_FILE_PRESUB && sd->srcp_stride == 0))
  142.                 return 0;
  143.  
  144.         return 1;
  145. }
  146.  
  147.  
  148. static void r300_swizzle_split(
  149.                 struct rc_src_register src, unsigned int mask,
  150.                 struct rc_swizzle_split * split)
  151. {
  152.         split->NumPhases = 0;
  153.  
  154.         while(mask) {
  155.                 unsigned int best_matchcount = 0;
  156.                 unsigned int best_matchmask = 0;
  157.                 int i, comp;
  158.  
  159.                 for(i = 0; i < num_native_swizzles; ++i) {
  160.                         const struct swizzle_data *sd = &native_swizzles[i];
  161.                         unsigned int matchcount = 0;
  162.                         unsigned int matchmask = 0;
  163.                         for(comp = 0; comp < 3; ++comp) {
  164.                                 unsigned int swz;
  165.                                 if (!GET_BIT(mask, comp))
  166.                                         continue;
  167.                                 swz = GET_SWZ(src.Swizzle, comp);
  168.                                 if (swz == RC_SWIZZLE_UNUSED)
  169.                                         continue;
  170.                                 if (swz == GET_SWZ(sd->hash, comp)) {
  171.                                         /* check if the negate bit of current component
  172.                                          * is the same for already matched components */
  173.                                         if (matchmask && (!!(src.Negate & matchmask) != !!(src.Negate & (1 << comp))))
  174.                                                 continue;
  175.  
  176.                                         matchcount++;
  177.                                         matchmask |= 1 << comp;
  178.                                 }
  179.                         }
  180.                         if (matchcount > best_matchcount) {
  181.                                 best_matchcount = matchcount;
  182.                                 best_matchmask = matchmask;
  183.                                 if (matchmask == (mask & RC_MASK_XYZ))
  184.                                         break;
  185.                         }
  186.                 }
  187.  
  188.                 if (mask & RC_MASK_W)
  189.                         best_matchmask |= RC_MASK_W;
  190.  
  191.                 split->Phase[split->NumPhases++] = best_matchmask;
  192.                 mask &= ~best_matchmask;
  193.         }
  194. }
  195.  
  196. struct rc_swizzle_caps r300_swizzle_caps = {
  197.         .IsNative = r300_swizzle_is_native,
  198.         .Split = r300_swizzle_split
  199. };
  200.  
  201.  
  202. /**
  203.  * Translate an RGB (XYZ) swizzle into the hardware code for the given
  204.  * instruction source.
  205.  */
  206. unsigned int r300FPTranslateRGBSwizzle(unsigned int src, unsigned int swizzle)
  207. {
  208.         const struct swizzle_data* sd = lookup_native_swizzle(swizzle);
  209.  
  210.         if (!sd || (src == RC_PAIR_PRESUB_SRC && sd->srcp_stride == 0)) {
  211.                 fprintf(stderr, "Not a native swizzle: %08x\n", swizzle);
  212.                 return 0;
  213.         }
  214.  
  215.         if (src == RC_PAIR_PRESUB_SRC) {
  216.                 return sd->base + sd->srcp_stride;
  217.         } else {
  218.                 return sd->base + src*sd->stride;
  219.         }
  220. }
  221.  
  222.  
  223. /**
  224.  * Translate an Alpha (W) swizzle into the hardware code for the given
  225.  * instruction source.
  226.  */
  227. unsigned int r300FPTranslateAlphaSwizzle(unsigned int src, unsigned int swizzle)
  228. {
  229.         unsigned int swz = GET_SWZ(swizzle, 0);
  230.         if (src == RC_PAIR_PRESUB_SRC) {
  231.                 return R300_ALU_ARGA_SRCP_X + swz;
  232.         }
  233.         if (swz < 3)
  234.                 return swz + 3*src;
  235.  
  236.         switch(swz) {
  237.         case RC_SWIZZLE_W: return R300_ALU_ARGA_SRC0A + src;
  238.         case RC_SWIZZLE_ONE: return R300_ALU_ARGA_ONE;
  239.         case RC_SWIZZLE_ZERO: return R300_ALU_ARGA_ZERO;
  240.         case RC_SWIZZLE_HALF: return R300_ALU_ARGA_HALF;
  241.         default: return R300_ALU_ARGA_ONE;
  242.         }
  243. }
  244.