"Fossies" - the Fresh Open Source Software Archive

Member "mesa-20.1.8/src/gallium/auxiliary/gallivm/lp_bld_quad.c" (16 Sep 2020, 7274 Bytes) of package /linux/misc/mesa-20.1.8.tar.xz:


As a special service "Fossies" has tried to format the requested source page into HTML format using (guessed) C and C++ source code syntax highlighting (style: standard) with prefixed line numbers and code folding option. Alternatively you can here view or download the uninterpreted source code file. For more information about "lp_bld_quad.c" see the Fossies "Dox" file reference documentation.

    1 /**************************************************************************
    2  *
    3  * Copyright 2010 VMware, Inc.
    4  * All Rights Reserved.
    5  *
    6  * Permission is hereby granted, free of charge, to any person obtaining a
    7  * copy of this software and associated documentation files (the
    8  * "Software"), to deal in the Software without restriction, including
    9  * without limitation the rights to use, copy, modify, merge, publish,
   10  * distribute, sub license, and/or sell copies of the Software, and to
   11  * permit persons to whom the Software is furnished to do so, subject to
   12  * the following conditions:
   13  *
   14  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
   15  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
   16  * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
   17  * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
   18  * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
   19  * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
   20  * USE OR OTHER DEALINGS IN THE SOFTWARE.
   21  *
   22  * The above copyright notice and this permission notice (including the
   23  * next paragraph) shall be included in all copies or substantial portions
   24  * of the Software.
   25  *
   26  **************************************************************************/
   27 
   28 
   29 #include "lp_bld_type.h"
   30 #include "lp_bld_arit.h"
   31 #include "lp_bld_const.h"
   32 #include "lp_bld_swizzle.h"
   33 #include "lp_bld_quad.h"
   34 #include "lp_bld_pack.h"
   35 
   36 
   37 static const unsigned char
   38 swizzle_left[4] = {
   39    LP_BLD_QUAD_TOP_LEFT,     LP_BLD_QUAD_TOP_LEFT,
   40    LP_BLD_QUAD_BOTTOM_LEFT,  LP_BLD_QUAD_BOTTOM_LEFT
   41 };
   42 
   43 static const unsigned char
   44 swizzle_right[4] = {
   45    LP_BLD_QUAD_TOP_RIGHT,    LP_BLD_QUAD_TOP_RIGHT,
   46    LP_BLD_QUAD_BOTTOM_RIGHT, LP_BLD_QUAD_BOTTOM_RIGHT
   47 };
   48 
   49 static const unsigned char
   50 swizzle_top[4] = {
   51    LP_BLD_QUAD_TOP_LEFT,     LP_BLD_QUAD_TOP_RIGHT,
   52    LP_BLD_QUAD_TOP_LEFT,     LP_BLD_QUAD_TOP_RIGHT
   53 };
   54 
   55 static const unsigned char
   56 swizzle_bottom[4] = {
   57    LP_BLD_QUAD_BOTTOM_LEFT,  LP_BLD_QUAD_BOTTOM_RIGHT,
   58    LP_BLD_QUAD_BOTTOM_LEFT,  LP_BLD_QUAD_BOTTOM_RIGHT
   59 };
   60 
   61 
   62 LLVMValueRef
   63 lp_build_ddx(struct lp_build_context *bld,
   64              LLVMValueRef a)
   65 {
   66    LLVMValueRef a_left  = lp_build_swizzle_aos(bld, a, swizzle_left);
   67    LLVMValueRef a_right = lp_build_swizzle_aos(bld, a, swizzle_right);
   68    return lp_build_sub(bld, a_right, a_left);
   69 }
   70 
   71 
   72 LLVMValueRef
   73 lp_build_ddy(struct lp_build_context *bld,
   74              LLVMValueRef a)
   75 {
   76    LLVMValueRef a_top    = lp_build_swizzle_aos(bld, a, swizzle_top);
   77    LLVMValueRef a_bottom = lp_build_swizzle_aos(bld, a, swizzle_bottom);
   78    return lp_build_sub(bld, a_bottom, a_top);
   79 }
   80 
   81 /*
   82  * Helper for building packed ddx/ddy vector for one coord (scalar per quad
   83  * values). The vector will look like this (8-wide):
   84  * dr1dx _____ -dr1dy _____ dr2dx _____ -dr2dy _____
   85  * This only requires one shuffle instead of two for more straightforward packing.
   86  */
   87 LLVMValueRef
   88 lp_build_packed_ddx_ddy_onecoord(struct lp_build_context *bld,
   89                                  LLVMValueRef a)
   90 {
   91    struct gallivm_state *gallivm = bld->gallivm;
   92    LLVMBuilderRef builder = gallivm->builder;
   93    LLVMValueRef vec1, vec2;
   94 
   95    /* use aos swizzle helper */
   96 
   97    static const unsigned char swizzle1[] = { /* no-op swizzle */
   98       LP_BLD_QUAD_TOP_LEFT, LP_BLD_SWIZZLE_DONTCARE,
   99       LP_BLD_QUAD_BOTTOM_LEFT, LP_BLD_SWIZZLE_DONTCARE
  100    };
  101    static const unsigned char swizzle2[] = {
  102       LP_BLD_QUAD_TOP_RIGHT, LP_BLD_SWIZZLE_DONTCARE,
  103       LP_BLD_QUAD_TOP_LEFT, LP_BLD_SWIZZLE_DONTCARE
  104    };
  105 
  106    vec1 = lp_build_swizzle_aos(bld, a, swizzle1);
  107    vec2 = lp_build_swizzle_aos(bld, a, swizzle2);
  108 
  109    if (bld->type.floating)
  110       return LLVMBuildFSub(builder, vec2, vec1, "ddxddy");
  111    else
  112       return LLVMBuildSub(builder, vec2, vec1, "ddxddy");
  113 }
  114 
  115 
  116 /*
  117  * Helper for building packed ddx/ddy vector for one coord (scalar per quad
  118  * values). The vector will look like this (8-wide):
  119  * ds1dx ds1dy dt1dx dt1dy ds2dx ds2dy dt2dx dt2dy
  120  * This only needs 2 (v)shufps.
  121  */
  122 LLVMValueRef
  123 lp_build_packed_ddx_ddy_twocoord(struct lp_build_context *bld,
  124                                  LLVMValueRef a, LLVMValueRef b)
  125 {
  126    struct gallivm_state *gallivm = bld->gallivm;
  127    LLVMBuilderRef builder = gallivm->builder;
  128    LLVMValueRef shuffles1[LP_MAX_VECTOR_LENGTH/4];
  129    LLVMValueRef shuffles2[LP_MAX_VECTOR_LENGTH/4];
  130    LLVMValueRef vec1, vec2;
  131    unsigned length, num_quads, i;
  132 
  133    /* XXX: do hsub version */
  134    length = bld->type.length;
  135    num_quads = length / 4;
  136    for (i = 0; i < num_quads; i++) {
  137       unsigned s1 = 4 * i;
  138       unsigned s2 = 4 * i + length;
  139       shuffles1[4*i + 0] = lp_build_const_int32(gallivm, LP_BLD_QUAD_TOP_LEFT + s1);
  140       shuffles1[4*i + 1] = lp_build_const_int32(gallivm, LP_BLD_QUAD_TOP_LEFT + s1);
  141       shuffles1[4*i + 2] = lp_build_const_int32(gallivm, LP_BLD_QUAD_TOP_LEFT + s2);
  142       shuffles1[4*i + 3] = lp_build_const_int32(gallivm, LP_BLD_QUAD_TOP_LEFT + s2);
  143       shuffles2[4*i + 0] = lp_build_const_int32(gallivm, LP_BLD_QUAD_TOP_RIGHT + s1);
  144       shuffles2[4*i + 1] = lp_build_const_int32(gallivm, LP_BLD_QUAD_BOTTOM_LEFT + s1);
  145       shuffles2[4*i + 2] = lp_build_const_int32(gallivm, LP_BLD_QUAD_TOP_RIGHT + s2);
  146       shuffles2[4*i + 3] = lp_build_const_int32(gallivm, LP_BLD_QUAD_BOTTOM_LEFT + s2);
  147    }
  148    vec1 = LLVMBuildShuffleVector(builder, a, b,
  149                                  LLVMConstVector(shuffles1, length), "");
  150    vec2 = LLVMBuildShuffleVector(builder, a, b,
  151                                  LLVMConstVector(shuffles2, length), "");
  152    if (bld->type.floating)
  153       return LLVMBuildFSub(builder, vec2, vec1, "ddxddyddxddy");
  154    else
  155       return LLVMBuildSub(builder, vec2, vec1, "ddxddyddxddy");
  156 }
  157 
  158 
  159 /**
  160  * Twiddle from quad format to row format
  161  *
  162  *   src0      src1
  163  * ######### #########      #################
  164  * # 0 | 1 # # 4 | 5 #      # 0 | 1 | 4 | 5 # src0
  165  * #---+---# #---+---#  ->  #################
  166  * # 2 | 3 # # 6 | 7 #      # 2 | 3 | 6 | 7 # src1
  167  * ######### #########      #################
  168  *
  169  */
  170 void
  171 lp_bld_quad_twiddle(struct gallivm_state *gallivm,
  172                     struct lp_type lp_dst_type,
  173                     const LLVMValueRef* src,
  174                     unsigned src_count,
  175                     LLVMValueRef* dst)
  176 {
  177    LLVMBuilderRef builder = gallivm->builder;
  178    LLVMTypeRef dst_type_ref;
  179    LLVMTypeRef type2_ref;
  180    struct lp_type type2;
  181    unsigned i;
  182 
  183    assert((src_count % 2) == 0);
  184 
  185    /* Create a type with only 2 elements */
  186    type2 = lp_dst_type;
  187    type2.width = (lp_dst_type.width * lp_dst_type.length) / 2;
  188    type2.length = 2;
  189    type2.floating = 0;
  190 
  191    type2_ref = lp_build_vec_type(gallivm, type2);
  192    dst_type_ref = lp_build_vec_type(gallivm, lp_dst_type);
  193 
  194    for (i = 0; i < src_count; i += 2) {
  195       LLVMValueRef src0, src1;
  196 
  197       src0 = LLVMBuildBitCast(builder, src[i + 0], type2_ref, "");
  198       src1 = LLVMBuildBitCast(builder, src[i + 1], type2_ref, "");
  199 
  200       dst[i + 0] = lp_build_interleave2(gallivm, type2, src0, src1, 0);
  201       dst[i + 1] = lp_build_interleave2(gallivm, type2, src0, src1, 1);
  202 
  203       dst[i + 0] = LLVMBuildBitCast(builder, dst[i + 0], dst_type_ref, "");
  204       dst[i + 1] = LLVMBuildBitCast(builder, dst[i + 1], dst_type_ref, "");
  205    }
  206 }