Subversion Repositories Kolibri OS

Rev

Blame | Last modification | View Log | RSS feed

  1. /**************************************************************************
  2.  *
  3.  * Copyright 2010, VMware Inc.
  4.  * All Rights Reserved.
  5.  *
  6.  * Permission is hereby granted, free of charge, to any person obtaining a
  7.  * copy of this software and associated documentation files (the
  8.  * "Software"), to deal in the Software without restriction, including
  9.  * without limitation the rights to use, copy, modify, merge, publish,
  10.  * distribute, sub license, and/or sell copies of the Software, and to
  11.  * permit persons to whom the Software is furnished to do so, subject to
  12.  * the following conditions:
  13.  *
  14.  * The above copyright notice and this permission notice (including the
  15.  * next paragraph) shall be included in all copies or substantial portions
  16.  * of the Software.
  17.  *
  18.  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
  19.  * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  20.  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
  21.  * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
  22.  * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
  23.  * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
  24.  * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
  25.  *
  26.  **************************************************************************/
  27.  
  28. /*
  29.  * Binning code for points
  30.  */
  31.  
  32. #include "util/u_math.h"
  33. #include "util/u_memory.h"
  34. #include "lp_setup_context.h"
  35. #include "lp_perf.h"
  36. #include "lp_rast.h"
  37. #include "lp_state_fs.h"
  38. #include "lp_state_setup.h"
  39. #include "lp_context.h"
  40. #include "tgsi/tgsi_scan.h"
  41. #include "draw/draw_context.h"
  42.  
  43. #define NUM_CHANNELS 4
  44.  
  45. struct point_info {
  46.    /* x,y deltas */
  47.    int dy01, dy12;
  48.    int dx01, dx12;
  49.  
  50.    const float (*v0)[4];
  51.  
  52.    float (*a0)[4];
  53.    float (*dadx)[4];
  54.    float (*dady)[4];
  55.  
  56.    boolean frontfacing;
  57. };  
  58.  
  59.  
  60. /**
  61.  * Compute a0 for a constant-valued coefficient (GL_FLAT shading).
  62.  */
  63. static void
  64. constant_coef(struct lp_setup_context *setup,
  65.               struct point_info *info,
  66.               unsigned slot,
  67.               const float value,
  68.               unsigned i)
  69. {
  70.    info->a0[slot][i] = value;
  71.    info->dadx[slot][i] = 0.0f;
  72.    info->dady[slot][i] = 0.0f;
  73. }
  74.  
  75.  
  76. static void
  77. point_persp_coeff(struct lp_setup_context *setup,
  78.                   const struct point_info *info,
  79.                   unsigned slot,
  80.                   unsigned i)
  81. {
  82.    /*
  83.     * Fragment shader expects pre-multiplied w for LP_INTERP_PERSPECTIVE. A
  84.     * better stratergy would be to take the primitive in consideration when
  85.     * generating the fragment shader key, and therefore avoid the per-fragment
  86.     * perspective divide.
  87.     */
  88.  
  89.    float w0 = info->v0[0][3];
  90.  
  91.    assert(i < 4);
  92.  
  93.    info->a0[slot][i] = info->v0[slot][i]*w0;
  94.    info->dadx[slot][i] = 0.0f;
  95.    info->dady[slot][i] = 0.0f;
  96. }
  97.  
  98.  
  99. /**
  100.  * Setup automatic texcoord coefficients (for sprite rendering).
  101.  * \param slot  the vertex attribute slot to setup
  102.  * \param i  the attribute channel in [0,3]
  103.  * \param sprite_coord_origin  one of PIPE_SPRITE_COORD_x
  104.  * \param perspective  does the shader expects pre-multiplied w, i.e.,
  105.  *    LP_INTERP_PERSPECTIVE is specified in the shader key
  106.  */
  107. static void
  108. texcoord_coef(struct lp_setup_context *setup,
  109.               const struct point_info *info,
  110.               unsigned slot,
  111.               unsigned i,
  112.               unsigned sprite_coord_origin,
  113.               boolean perspective)
  114. {
  115.    float w0 = info->v0[0][3];
  116.  
  117.    assert(i < 4);
  118.  
  119.    if (i == 0) {
  120.       float dadx = FIXED_ONE / (float)info->dx12;
  121.       float dady =  0.0f;
  122.       float x0 = info->v0[0][0] - setup->pixel_offset;
  123.       float y0 = info->v0[0][1] - setup->pixel_offset;
  124.  
  125.       info->dadx[slot][0] = dadx;
  126.       info->dady[slot][0] = dady;
  127.       info->a0[slot][0] = 0.5 - (dadx * x0 + dady * y0);
  128.  
  129.       if (perspective) {
  130.          info->dadx[slot][0] *= w0;
  131.          info->dady[slot][0] *= w0;
  132.          info->a0[slot][0] *= w0;
  133.       }
  134.    }
  135.    else if (i == 1) {
  136.       float dadx = 0.0f;
  137.       float dady = FIXED_ONE / (float)info->dx12;
  138.       float x0 = info->v0[0][0] - setup->pixel_offset;
  139.       float y0 = info->v0[0][1] - setup->pixel_offset;
  140.  
  141.       if (sprite_coord_origin == PIPE_SPRITE_COORD_LOWER_LEFT) {
  142.          dady = -dady;
  143.       }
  144.  
  145.       info->dadx[slot][1] = dadx;
  146.       info->dady[slot][1] = dady;
  147.       info->a0[slot][1] = 0.5 - (dadx * x0 + dady * y0);
  148.  
  149.       if (perspective) {
  150.          info->dadx[slot][1] *= w0;
  151.          info->dady[slot][1] *= w0;
  152.          info->a0[slot][1] *= w0;
  153.       }
  154.    }
  155.    else if (i == 2) {
  156.       info->a0[slot][2] = 0.0f;
  157.       info->dadx[slot][2] = 0.0f;
  158.       info->dady[slot][2] = 0.0f;
  159.    }
  160.    else {
  161.       info->a0[slot][3] = perspective ? w0 : 1.0f;
  162.       info->dadx[slot][3] = 0.0f;
  163.       info->dady[slot][3] = 0.0f;
  164.    }
  165. }
  166.  
  167.  
  168. /**
  169.  * Special coefficient setup for gl_FragCoord.
  170.  * X and Y are trivial
  171.  * Z and W are copied from position_coef which should have already been computed.
  172.  * We could do a bit less work if we'd examine gl_FragCoord's swizzle mask.
  173.  */
  174. static void
  175. setup_point_fragcoord_coef(struct lp_setup_context *setup,
  176.                            struct point_info *info,
  177.                            unsigned slot,
  178.                            unsigned usage_mask)
  179. {
  180.    /*X*/
  181.    if (usage_mask & TGSI_WRITEMASK_X) {
  182.       info->a0[slot][0] = 0.0;
  183.       info->dadx[slot][0] = 1.0;
  184.       info->dady[slot][0] = 0.0;
  185.    }
  186.  
  187.    /*Y*/
  188.    if (usage_mask & TGSI_WRITEMASK_Y) {
  189.       info->a0[slot][1] = 0.0;
  190.       info->dadx[slot][1] = 0.0;
  191.       info->dady[slot][1] = 1.0;
  192.    }
  193.  
  194.    /*Z*/
  195.    if (usage_mask & TGSI_WRITEMASK_Z) {
  196.       constant_coef(setup, info, slot, info->v0[0][2], 2);
  197.    }
  198.  
  199.    /*W*/
  200.    if (usage_mask & TGSI_WRITEMASK_W) {
  201.       constant_coef(setup, info, slot, info->v0[0][3], 3);
  202.    }
  203. }
  204.  
  205.  
  206. /**
  207.  * Compute the point->coef[] array dadx, dady, a0 values.
  208.  */
  209. static void  
  210. setup_point_coefficients( struct lp_setup_context *setup,
  211.                           struct point_info *info)
  212. {
  213.    const struct lp_setup_variant_key *key = &setup->setup.variant->key;
  214.    const struct lp_fragment_shader *shader = setup->fs.current.variant->shader;
  215.    unsigned fragcoord_usage_mask = TGSI_WRITEMASK_XYZ;
  216.    unsigned slot;
  217.  
  218.    /* setup interpolation for all the remaining attributes:
  219.     */
  220.    for (slot = 0; slot < key->num_inputs; slot++) {
  221.       unsigned vert_attr = key->inputs[slot].src_index;
  222.       unsigned usage_mask = key->inputs[slot].usage_mask;
  223.       enum lp_interp interp = key->inputs[slot].interp;
  224.       boolean perspective = !!(interp == LP_INTERP_PERSPECTIVE);
  225.       unsigned i;
  226.  
  227.       if (perspective & usage_mask) {
  228.          fragcoord_usage_mask |= TGSI_WRITEMASK_W;
  229.       }
  230.      
  231.       switch (interp) {
  232.       case LP_INTERP_POSITION:
  233.          /*
  234.           * The generated pixel interpolators will pick up the coeffs from
  235.           * slot 0, so all need to ensure that the usage mask is covers all
  236.           * usages.
  237.           */
  238.          fragcoord_usage_mask |= usage_mask;
  239.          break;
  240.  
  241.       case LP_INTERP_LINEAR:
  242.          /* Sprite tex coords may use linear interpolation someday */
  243.          /* fall-through */
  244.       case LP_INTERP_PERSPECTIVE:
  245.          /* check if the sprite coord flag is set for this attribute.
  246.           * If so, set it up so it up so x and y vary from 0 to 1.
  247.           */
  248.          if (shader->info.base.input_semantic_name[slot] == TGSI_SEMANTIC_GENERIC) {
  249.             unsigned semantic_index = shader->info.base.input_semantic_index[slot];
  250.             /* Note that sprite_coord enable is a bitfield of
  251.              * PIPE_MAX_SHADER_OUTPUTS bits.
  252.              */
  253.             if (semantic_index < PIPE_MAX_SHADER_OUTPUTS &&
  254.                 (setup->sprite_coord_enable & (1 << semantic_index))) {
  255.                for (i = 0; i < NUM_CHANNELS; i++) {
  256.                   if (usage_mask & (1 << i)) {
  257.                      texcoord_coef(setup, info, slot + 1, i,
  258.                                    setup->sprite_coord_origin,
  259.                                    perspective);
  260.                   }
  261.                }
  262.                break;
  263.             }
  264.          }
  265.          /* fall-through */
  266.       case LP_INTERP_CONSTANT:
  267.          for (i = 0; i < NUM_CHANNELS; i++) {
  268.             if (usage_mask & (1 << i)) {
  269.                if (perspective) {
  270.                   point_persp_coeff(setup, info, slot+1, i);
  271.                }
  272.                else {
  273.                   constant_coef(setup, info, slot+1, info->v0[vert_attr][i], i);
  274.                }
  275.             }
  276.          }
  277.          break;
  278.  
  279.       case LP_INTERP_FACING:
  280.          for (i = 0; i < NUM_CHANNELS; i++)
  281.             if (usage_mask & (1 << i))
  282.                constant_coef(setup, info, slot+1,
  283.                              info->frontfacing ? 1.0f : -1.0f, i);
  284.          break;
  285.  
  286.       default:
  287.          assert(0);
  288.          break;
  289.       }
  290.    }
  291.  
  292.    /* The internal position input is in slot zero:
  293.     */
  294.    setup_point_fragcoord_coef(setup, info, 0,
  295.                               fragcoord_usage_mask);
  296. }
  297.  
  298.  
  299. static INLINE int
  300. subpixel_snap(float a)
  301. {
  302.    return util_iround(FIXED_ONE * a);
  303. }
  304.  
  305. /**
  306.  * Print point vertex attribs (for debug).
  307.  */
  308. static void
  309. print_point(struct lp_setup_context *setup,
  310.             const float (*v0)[4],
  311.             const float size)
  312. {
  313.    const struct lp_setup_variant_key *key = &setup->setup.variant->key;
  314.    uint i;
  315.  
  316.    debug_printf("llvmpipe point, width %f\n", size);
  317.    for (i = 0; i < 1 + key->num_inputs; i++) {
  318.       debug_printf("  v0[%d]:  %f %f %f %f\n", i,
  319.                    v0[i][0], v0[i][1], v0[i][2], v0[i][3]);
  320.    }
  321. }
  322.  
  323.  
  324. static boolean
  325. try_setup_point( struct lp_setup_context *setup,
  326.                  const float (*v0)[4] )
  327. {
  328.    struct llvmpipe_context *lp_context = (struct llvmpipe_context *)setup->pipe;
  329.    /* x/y positions in fixed point */
  330.    const struct lp_setup_variant_key *key = &setup->setup.variant->key;
  331.    const int sizeAttr = setup->psize;
  332.    const float size
  333.       = (setup->point_size_per_vertex && sizeAttr > 0) ? v0[sizeAttr][0]
  334.       : setup->point_size;
  335.  
  336.    /* Yes this is necessary to accurately calculate bounding boxes
  337.     * with the two fill-conventions we support.  GL (normally) ends
  338.     * up needing a bottom-left fill convention, which requires
  339.     * slightly different rounding.
  340.     */
  341.    int adj = (setup->bottom_edge_rule != 0) ? 1 : 0;
  342.  
  343.    struct lp_scene *scene = setup->scene;
  344.    struct lp_rast_triangle *point;
  345.    unsigned bytes;
  346.    struct u_rect bbox;
  347.    unsigned nr_planes = 4;
  348.    struct point_info info;
  349.    unsigned viewport_index = 0;
  350.    unsigned layer = 0;
  351.    int fixed_width;
  352.  
  353.    if (setup->viewport_index_slot > 0) {
  354.       unsigned *udata = (unsigned*)v0[setup->viewport_index_slot];
  355.       viewport_index = lp_clamp_viewport_idx(*udata);
  356.    }
  357.    if (setup->layer_slot > 0) {
  358.       layer = *(unsigned*)v0[setup->layer_slot];
  359.       layer = MIN2(layer, scene->fb_max_layer);
  360.    }
  361.  
  362.    if (0)
  363.       print_point(setup, v0, size);
  364.  
  365.    /* Bounding rectangle (in pixels) */
  366.    if (!lp_context->rasterizer ||
  367.        lp_context->rasterizer->point_quad_rasterization) {
  368.       /*
  369.        * Rasterize points as quads.
  370.        */
  371.       int x0, y0;
  372.       /* Point size as fixed point integer, remove rounding errors
  373.        * and gives minimum width for very small points.
  374.        */
  375.       fixed_width = MAX2(FIXED_ONE, subpixel_snap(size));
  376.  
  377.       x0 = subpixel_snap(v0[0][0] - setup->pixel_offset) - fixed_width/2;
  378.       y0 = subpixel_snap(v0[0][1] - setup->pixel_offset) - fixed_width/2;
  379.  
  380.       bbox.x0 = (x0 + (FIXED_ONE-1)) >> FIXED_ORDER;
  381.       bbox.x1 = (x0 + fixed_width + (FIXED_ONE-1)) >> FIXED_ORDER;
  382.       bbox.y0 = (y0 + (FIXED_ONE-1) + adj) >> FIXED_ORDER;
  383.       bbox.y1 = (y0 + fixed_width + (FIXED_ONE-1) + adj) >> FIXED_ORDER;
  384.  
  385.       /* Inclusive coordinates:
  386.        */
  387.       bbox.x1--;
  388.       bbox.y1--;
  389.    } else {
  390.       /*
  391.        * OpenGL legacy rasterization rules for non-sprite points.
  392.        *
  393.        * Per OpenGL 2.1 spec, section 3.3.1, "Basic Point Rasterization".
  394.        *
  395.        * This type of point rasterization is only available in pre 3.0 contexts
  396.        * (or compatibilility contexts which we don't support) anyway.
  397.        */
  398.  
  399.       const int x0 = subpixel_snap(v0[0][0]);
  400.       const int y0 = subpixel_snap(v0[0][1]) - adj;
  401.  
  402.       int int_width;
  403.       /* Point size as fixed point integer. For GL legacy points
  404.        * the point size is always a whole integer.
  405.        */
  406.       fixed_width = MAX2(FIXED_ONE,
  407.                          (subpixel_snap(size) + FIXED_ONE/2 - 1) & ~(FIXED_ONE-1));
  408.       int_width = fixed_width >> FIXED_ORDER;
  409.  
  410.       assert(setup->pixel_offset != 0);
  411.  
  412.       if (int_width == 1) {
  413.          bbox.x0 = x0 >> FIXED_ORDER;
  414.          bbox.y0 = y0 >> FIXED_ORDER;
  415.          bbox.x1 = bbox.x0;
  416.          bbox.y1 = bbox.y0;
  417.       } else {
  418.          if (int_width & 1) {
  419.             /* Odd width */
  420.             bbox.x0 = (x0 >> FIXED_ORDER) - (int_width - 1)/2;
  421.             bbox.y0 = (y0 >> FIXED_ORDER) - (int_width - 1)/2;
  422.          } else {
  423.             /* Even width */
  424.             bbox.x0 = ((x0 + FIXED_ONE/2) >> FIXED_ORDER) - int_width/2;
  425.             bbox.y0 = ((y0 + FIXED_ONE/2) >> FIXED_ORDER) - int_width/2;
  426.          }
  427.  
  428.          bbox.x1 = bbox.x0 + int_width - 1;
  429.          bbox.y1 = bbox.y0 + int_width - 1;
  430.       }
  431.    }
  432.  
  433.    if (0) {
  434.       debug_printf("  bbox: (%i, %i) - (%i, %i)\n",
  435.                    bbox.x0, bbox.y0,
  436.                    bbox.x1, bbox.y1);
  437.    }
  438.  
  439.    if (!u_rect_test_intersection(&setup->draw_regions[viewport_index], &bbox)) {
  440.       if (0) debug_printf("offscreen\n");
  441.       LP_COUNT(nr_culled_tris);
  442.       return TRUE;
  443.    }
  444.  
  445.    u_rect_find_intersection(&setup->draw_regions[viewport_index], &bbox);
  446.  
  447.    point = lp_setup_alloc_triangle(scene,
  448.                                    key->num_inputs,
  449.                                    nr_planes,
  450.                                    &bytes);
  451.    if (!point)
  452.       return FALSE;
  453.  
  454. #ifdef DEBUG
  455.    point->v[0][0] = v0[0][0];
  456.    point->v[0][1] = v0[0][1];
  457. #endif
  458.  
  459.    LP_COUNT(nr_tris);
  460.  
  461.    if (lp_context->active_statistics_queries &&
  462.        !llvmpipe_rasterization_disabled(lp_context)) {
  463.       lp_context->pipeline_statistics.c_primitives++;
  464.    }
  465.  
  466.    if (draw_will_inject_frontface(lp_context->draw) &&
  467.        setup->face_slot > 0) {
  468.       point->inputs.frontfacing = v0[setup->face_slot][0];
  469.    } else {
  470.       point->inputs.frontfacing = TRUE;
  471.    }
  472.  
  473.    info.v0 = v0;
  474.    info.dx01 = 0;
  475.    info.dx12 = fixed_width;
  476.    info.dy01 = fixed_width;
  477.    info.dy12 = 0;
  478.    info.a0 = GET_A0(&point->inputs);
  479.    info.dadx = GET_DADX(&point->inputs);
  480.    info.dady = GET_DADY(&point->inputs);
  481.    info.frontfacing = point->inputs.frontfacing;
  482.    
  483.    /* Setup parameter interpolants:
  484.     */
  485.    setup_point_coefficients(setup, &info);
  486.  
  487.    point->inputs.disable = FALSE;
  488.    point->inputs.opaque = FALSE;
  489.    point->inputs.layer = layer;
  490.    point->inputs.viewport_index = viewport_index;
  491.  
  492.    {
  493.       struct lp_rast_plane *plane = GET_PLANES(point);
  494.  
  495.       plane[0].dcdx = -1;
  496.       plane[0].dcdy = 0;
  497.       plane[0].c = 1-bbox.x0;
  498.       plane[0].eo = 1;
  499.  
  500.       plane[1].dcdx = 1;
  501.       plane[1].dcdy = 0;
  502.       plane[1].c = bbox.x1+1;
  503.       plane[1].eo = 0;
  504.  
  505.       plane[2].dcdx = 0;
  506.       plane[2].dcdy = 1;
  507.       plane[2].c = 1-bbox.y0;
  508.       plane[2].eo = 1;
  509.  
  510.       plane[3].dcdx = 0;
  511.       plane[3].dcdy = -1;
  512.       plane[3].c = bbox.y1+1;
  513.       plane[3].eo = 0;
  514.    }
  515.  
  516.    return lp_setup_bin_triangle(setup, point, &bbox, nr_planes, viewport_index);
  517. }
  518.  
  519.  
  520. static void
  521. lp_setup_point(struct lp_setup_context *setup,
  522.                const float (*v0)[4])
  523. {
  524.    if (!try_setup_point( setup, v0 ))
  525.    {
  526.       if (!lp_setup_flush_and_restart(setup))
  527.          return;
  528.  
  529.       if (!try_setup_point( setup, v0 ))
  530.          return;
  531.    }
  532. }
  533.  
  534.  
  535. void
  536. lp_setup_choose_point( struct lp_setup_context *setup )
  537. {
  538.    setup->point = lp_setup_point;
  539. }
  540.  
  541.  
  542.