Subversion Repositories Kolibri OS

Rev

Go to most recent revision | Blame | Last modification | View Log | RSS feed

  1. /**************************************************************************
  2.  *
  3.  * Copyright 2010, VMware Inc.
  4.  * All Rights Reserved.
  5.  *
  6.  * Permission is hereby granted, free of charge, to any person obtaining a
  7.  * copy of this software and associated documentation files (the
  8.  * "Software"), to deal in the Software without restriction, including
  9.  * without limitation the rights to use, copy, modify, merge, publish,
  10.  * distribute, sub license, and/or sell copies of the Software, and to
  11.  * permit persons to whom the Software is furnished to do so, subject to
  12.  * the following conditions:
  13.  *
  14.  * The above copyright notice and this permission notice (including the
  15.  * next paragraph) shall be included in all copies or substantial portions
  16.  * of the Software.
  17.  *
  18.  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
  19.  * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  20.  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
  21.  * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
  22.  * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
  23.  * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
  24.  * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
  25.  *
  26.  **************************************************************************/
  27.  
  28. /*
  29.  * Binning code for points
  30.  */
  31.  
  32. #include "util/u_math.h"
  33. #include "util/u_memory.h"
  34. #include "lp_setup_context.h"
  35. #include "lp_perf.h"
  36. #include "lp_rast.h"
  37. #include "lp_state_fs.h"
  38. #include "lp_state_setup.h"
  39. #include "lp_context.h"
  40. #include "tgsi/tgsi_scan.h"
  41.  
  42. #define NUM_CHANNELS 4
  43.  
  44. struct point_info {
  45.    /* x,y deltas */
  46.    int dy01, dy12;
  47.    int dx01, dx12;
  48.  
  49.    const float (*v0)[4];
  50.  
  51.    float (*a0)[4];
  52.    float (*dadx)[4];
  53.    float (*dady)[4];
  54. };  
  55.  
  56.  
  57. /**
  58.  * Compute a0 for a constant-valued coefficient (GL_FLAT shading).
  59.  */
  60. static void
  61. constant_coef(struct lp_setup_context *setup,
  62.               struct point_info *info,
  63.               unsigned slot,
  64.               const float value,
  65.               unsigned i)
  66. {
  67.    info->a0[slot][i] = value;
  68.    info->dadx[slot][i] = 0.0f;
  69.    info->dady[slot][i] = 0.0f;
  70. }
  71.  
  72.  
  73. static void
  74. point_persp_coeff(struct lp_setup_context *setup,
  75.                   const struct point_info *info,
  76.                   unsigned slot,
  77.                   unsigned i)
  78. {
  79.    /*
  80.     * Fragment shader expects pre-multiplied w for LP_INTERP_PERSPECTIVE. A
  81.     * better stratergy would be to take the primitive in consideration when
  82.     * generating the fragment shader key, and therefore avoid the per-fragment
  83.     * perspective divide.
  84.     */
  85.  
  86.    float w0 = info->v0[0][3];
  87.  
  88.    assert(i < 4);
  89.  
  90.    info->a0[slot][i] = info->v0[slot][i]*w0;
  91.    info->dadx[slot][i] = 0.0f;
  92.    info->dady[slot][i] = 0.0f;
  93. }
  94.  
  95.  
  96. /**
  97.  * Setup automatic texcoord coefficients (for sprite rendering).
  98.  * \param slot  the vertex attribute slot to setup
  99.  * \param i  the attribute channel in [0,3]
  100.  * \param sprite_coord_origin  one of PIPE_SPRITE_COORD_x
  101.  * \param perspective  does the shader expects pre-multiplied w, i.e.,
  102.  *    LP_INTERP_PERSPECTIVE is specified in the shader key
  103.  */
  104. static void
  105. texcoord_coef(struct lp_setup_context *setup,
  106.               const struct point_info *info,
  107.               unsigned slot,
  108.               unsigned i,
  109.               unsigned sprite_coord_origin,
  110.               boolean perspective)
  111. {
  112.    float w0 = info->v0[0][3];
  113.  
  114.    assert(i < 4);
  115.  
  116.    if (i == 0) {
  117.       float dadx = FIXED_ONE / (float)info->dx12;
  118.       float dady =  0.0f;
  119.       float x0 = info->v0[0][0] - setup->pixel_offset;
  120.       float y0 = info->v0[0][1] - setup->pixel_offset;
  121.  
  122.       info->dadx[slot][0] = dadx;
  123.       info->dady[slot][0] = dady;
  124.       info->a0[slot][0] = 0.5 - (dadx * x0 + dady * y0);
  125.  
  126.       if (perspective) {
  127.          info->dadx[slot][0] *= w0;
  128.          info->dady[slot][0] *= w0;
  129.          info->a0[slot][0] *= w0;
  130.       }
  131.    }
  132.    else if (i == 1) {
  133.       float dadx = 0.0f;
  134.       float dady = FIXED_ONE / (float)info->dx12;
  135.       float x0 = info->v0[0][0] - setup->pixel_offset;
  136.       float y0 = info->v0[0][1] - setup->pixel_offset;
  137.  
  138.       if (sprite_coord_origin == PIPE_SPRITE_COORD_LOWER_LEFT) {
  139.          dady = -dady;
  140.       }
  141.  
  142.       info->dadx[slot][1] = dadx;
  143.       info->dady[slot][1] = dady;
  144.       info->a0[slot][1] = 0.5 - (dadx * x0 + dady * y0);
  145.  
  146.       if (perspective) {
  147.          info->dadx[slot][1] *= w0;
  148.          info->dady[slot][1] *= w0;
  149.          info->a0[slot][1] *= w0;
  150.       }
  151.    }
  152.    else if (i == 2) {
  153.       info->a0[slot][2] = 0.0f;
  154.       info->dadx[slot][2] = 0.0f;
  155.       info->dady[slot][2] = 0.0f;
  156.    }
  157.    else {
  158.       info->a0[slot][3] = perspective ? w0 : 1.0f;
  159.       info->dadx[slot][3] = 0.0f;
  160.       info->dady[slot][3] = 0.0f;
  161.    }
  162. }
  163.  
  164.  
  165. /**
  166.  * Special coefficient setup for gl_FragCoord.
  167.  * X and Y are trivial
  168.  * Z and W are copied from position_coef which should have already been computed.
  169.  * We could do a bit less work if we'd examine gl_FragCoord's swizzle mask.
  170.  */
  171. static void
  172. setup_point_fragcoord_coef(struct lp_setup_context *setup,
  173.                            struct point_info *info,
  174.                            unsigned slot,
  175.                            unsigned usage_mask)
  176. {
  177.    /*X*/
  178.    if (usage_mask & TGSI_WRITEMASK_X) {
  179.       info->a0[slot][0] = 0.0;
  180.       info->dadx[slot][0] = 1.0;
  181.       info->dady[slot][0] = 0.0;
  182.    }
  183.  
  184.    /*Y*/
  185.    if (usage_mask & TGSI_WRITEMASK_Y) {
  186.       info->a0[slot][1] = 0.0;
  187.       info->dadx[slot][1] = 0.0;
  188.       info->dady[slot][1] = 1.0;
  189.    }
  190.  
  191.    /*Z*/
  192.    if (usage_mask & TGSI_WRITEMASK_Z) {
  193.       constant_coef(setup, info, slot, info->v0[0][2], 2);
  194.    }
  195.  
  196.    /*W*/
  197.    if (usage_mask & TGSI_WRITEMASK_W) {
  198.       constant_coef(setup, info, slot, info->v0[0][3], 3);
  199.    }
  200. }
  201.  
  202.  
  203. /**
  204.  * Compute the point->coef[] array dadx, dady, a0 values.
  205.  */
  206. static void  
  207. setup_point_coefficients( struct lp_setup_context *setup,
  208.                           struct point_info *info)
  209. {
  210.    const struct lp_setup_variant_key *key = &setup->setup.variant->key;
  211.    const struct lp_fragment_shader *shader = setup->fs.current.variant->shader;
  212.    unsigned fragcoord_usage_mask = TGSI_WRITEMASK_XYZ;
  213.    unsigned slot;
  214.  
  215.    /* setup interpolation for all the remaining attributes:
  216.     */
  217.    for (slot = 0; slot < key->num_inputs; slot++) {
  218.       unsigned vert_attr = key->inputs[slot].src_index;
  219.       unsigned usage_mask = key->inputs[slot].usage_mask;
  220.       enum lp_interp interp = key->inputs[slot].interp;
  221.       boolean perspective = !!(interp == LP_INTERP_PERSPECTIVE);
  222.       unsigned i;
  223.  
  224.       if (perspective & usage_mask) {
  225.          fragcoord_usage_mask |= TGSI_WRITEMASK_W;
  226.       }
  227.      
  228.       switch (interp) {
  229.       case LP_INTERP_POSITION:
  230.          /*
  231.           * The generated pixel interpolators will pick up the coeffs from
  232.           * slot 0, so all need to ensure that the usage mask is covers all
  233.           * usages.
  234.           */
  235.          fragcoord_usage_mask |= usage_mask;
  236.          break;
  237.  
  238.       case LP_INTERP_LINEAR:
  239.          /* Sprite tex coords may use linear interpolation someday */
  240.          /* fall-through */
  241.       case LP_INTERP_PERSPECTIVE:
  242.          /* check if the sprite coord flag is set for this attribute.
  243.           * If so, set it up so it up so x and y vary from 0 to 1.
  244.           */
  245.          if (shader->info.base.input_semantic_name[slot] == TGSI_SEMANTIC_GENERIC) {
  246.             unsigned semantic_index = shader->info.base.input_semantic_index[slot];
  247.             /* Note that sprite_coord enable is a bitfield of
  248.              * PIPE_MAX_SHADER_OUTPUTS bits.
  249.              */
  250.             if (semantic_index < PIPE_MAX_SHADER_OUTPUTS &&
  251.                 (setup->sprite_coord_enable & (1 << semantic_index))) {
  252.                for (i = 0; i < NUM_CHANNELS; i++) {
  253.                   if (usage_mask & (1 << i)) {
  254.                      texcoord_coef(setup, info, slot + 1, i,
  255.                                    setup->sprite_coord_origin,
  256.                                    perspective);
  257.                   }
  258.                }
  259.                break;
  260.             }
  261.          }
  262.          /* fall-through */
  263.       case LP_INTERP_CONSTANT:
  264.          for (i = 0; i < NUM_CHANNELS; i++) {
  265.             if (usage_mask & (1 << i)) {
  266.                if (perspective) {
  267.                   point_persp_coeff(setup, info, slot+1, i);
  268.                }
  269.                else {
  270.                   constant_coef(setup, info, slot+1, info->v0[vert_attr][i], i);
  271.                }
  272.             }
  273.          }
  274.          break;
  275.  
  276.       case LP_INTERP_FACING:
  277.          for (i = 0; i < NUM_CHANNELS; i++)
  278.             if (usage_mask & (1 << i))
  279.                constant_coef(setup, info, slot+1, 1.0, i);
  280.          break;
  281.  
  282.       default:
  283.          assert(0);
  284.          break;
  285.       }
  286.    }
  287.  
  288.    /* The internal position input is in slot zero:
  289.     */
  290.    setup_point_fragcoord_coef(setup, info, 0,
  291.                               fragcoord_usage_mask);
  292. }
  293.  
  294.  
  295. static INLINE int
  296. subpixel_snap(float a)
  297. {
  298.    return util_iround(FIXED_ONE * a);
  299. }
  300.  
  301.  
  302. static boolean
  303. try_setup_point( struct lp_setup_context *setup,
  304.                  const float (*v0)[4] )
  305. {
  306.    struct llvmpipe_context *lp_context = (struct llvmpipe_context *)setup->pipe;
  307.    /* x/y positions in fixed point */
  308.    const struct lp_setup_variant_key *key = &setup->setup.variant->key;
  309.    const int sizeAttr = setup->psize;
  310.    const float size
  311.       = (setup->point_size_per_vertex && sizeAttr > 0) ? v0[sizeAttr][0]
  312.       : setup->point_size;
  313.    
  314.    /* Point size as fixed point integer, remove rounding errors
  315.     * and gives minimum width for very small points
  316.     */
  317.    int fixed_width = MAX2(FIXED_ONE,
  318.                           (subpixel_snap(size) + FIXED_ONE/2 - 1) & ~(FIXED_ONE-1));
  319.  
  320.    const int x0 = subpixel_snap(v0[0][0] - setup->pixel_offset) - fixed_width/2;
  321.    const int y0 = subpixel_snap(v0[0][1] - setup->pixel_offset) - fixed_width/2;
  322.      
  323.    struct lp_scene *scene = setup->scene;
  324.    struct lp_rast_triangle *point;
  325.    unsigned bytes;
  326.    struct u_rect bbox;
  327.    unsigned nr_planes = 4;
  328.    struct point_info info;
  329.    unsigned scissor_index = 0;
  330.    unsigned layer = 0;
  331.  
  332.    if (setup->viewport_index_slot > 0) {
  333.       unsigned *udata = (unsigned*)v0[setup->viewport_index_slot];
  334.       scissor_index = lp_clamp_scissor_idx(*udata);
  335.    }
  336.    if (setup->layer_slot > 0) {
  337.       layer = *(unsigned*)v0[setup->layer_slot];
  338.       layer = MIN2(layer, scene->fb_max_layer);
  339.    }
  340.  
  341.    /* Bounding rectangle (in pixels) */
  342.    {
  343.       /* Yes this is necessary to accurately calculate bounding boxes
  344.        * with the two fill-conventions we support.  GL (normally) ends
  345.        * up needing a bottom-left fill convention, which requires
  346.        * slightly different rounding.
  347.        */
  348.       int adj = (setup->pixel_offset != 0) ? 1 : 0;
  349.  
  350.       bbox.x0 = (x0 + (FIXED_ONE-1) + adj) >> FIXED_ORDER;
  351.       bbox.x1 = (x0 + fixed_width + (FIXED_ONE-1) + adj) >> FIXED_ORDER;
  352.       bbox.y0 = (y0 + (FIXED_ONE-1)) >> FIXED_ORDER;
  353.       bbox.y1 = (y0 + fixed_width + (FIXED_ONE-1)) >> FIXED_ORDER;
  354.  
  355.       /* Inclusive coordinates:
  356.        */
  357.       bbox.x1--;
  358.       bbox.y1--;
  359.    }
  360.    
  361.    if (!u_rect_test_intersection(&setup->draw_regions[scissor_index], &bbox)) {
  362.       if (0) debug_printf("offscreen\n");
  363.       LP_COUNT(nr_culled_tris);
  364.       return TRUE;
  365.    }
  366.  
  367.    u_rect_find_intersection(&setup->draw_regions[scissor_index], &bbox);
  368.  
  369.    point = lp_setup_alloc_triangle(scene,
  370.                                    key->num_inputs,
  371.                                    nr_planes,
  372.                                    &bytes);
  373.    if (!point)
  374.       return FALSE;
  375.  
  376. #ifdef DEBUG
  377.    point->v[0][0] = v0[0][0];
  378.    point->v[0][1] = v0[0][1];
  379. #endif
  380.  
  381.    LP_COUNT(nr_tris);
  382.  
  383.    if (lp_context->active_statistics_queries) {
  384.       lp_context->pipeline_statistics.c_primitives++;
  385.    }
  386.  
  387.    info.v0 = v0;
  388.    info.dx01 = 0;
  389.    info.dx12 = fixed_width;
  390.    info.dy01 = fixed_width;
  391.    info.dy12 = 0;
  392.    info.a0 = GET_A0(&point->inputs);
  393.    info.dadx = GET_DADX(&point->inputs);
  394.    info.dady = GET_DADY(&point->inputs);
  395.    
  396.    /* Setup parameter interpolants:
  397.     */
  398.    setup_point_coefficients(setup, &info);
  399.  
  400.    point->inputs.frontfacing = TRUE;
  401.    point->inputs.disable = FALSE;
  402.    point->inputs.opaque = FALSE;
  403.    point->inputs.layer = layer;
  404.  
  405.    {
  406.       struct lp_rast_plane *plane = GET_PLANES(point);
  407.  
  408.       plane[0].dcdx = -1;
  409.       plane[0].dcdy = 0;
  410.       plane[0].c = 1-bbox.x0;
  411.       plane[0].eo = 1;
  412.  
  413.       plane[1].dcdx = 1;
  414.       plane[1].dcdy = 0;
  415.       plane[1].c = bbox.x1+1;
  416.       plane[1].eo = 0;
  417.  
  418.       plane[2].dcdx = 0;
  419.       plane[2].dcdy = 1;
  420.       plane[2].c = 1-bbox.y0;
  421.       plane[2].eo = 1;
  422.  
  423.       plane[3].dcdx = 0;
  424.       plane[3].dcdy = -1;
  425.       plane[3].c = bbox.y1+1;
  426.       plane[3].eo = 0;
  427.    }
  428.  
  429.    return lp_setup_bin_triangle(setup, point, &bbox, nr_planes, scissor_index);
  430. }
  431.  
  432.  
  433. static void
  434. lp_setup_point(struct lp_setup_context *setup,
  435.                const float (*v0)[4])
  436. {
  437.    if (!try_setup_point( setup, v0 ))
  438.    {
  439.       if (!lp_setup_flush_and_restart(setup))
  440.          return;
  441.  
  442.       if (!try_setup_point( setup, v0 ))
  443.          return;
  444.    }
  445. }
  446.  
  447.  
  448. void
  449. lp_setup_choose_point( struct lp_setup_context *setup )
  450. {
  451.    setup->point = lp_setup_point;
  452. }
  453.  
  454.  
  455.