On 02/06/2015 06:56 AM, Ilia Mirkin wrote:
> From: Dave Airlie <airl...@gmail.com>
> 
> Signed-off-by: Dave Airlie <airl...@redhat.com>
> ---
>  src/glsl/ir_set_program_inouts.cpp | 28 +++++++++++++++++++++++++---
>  1 file changed, 25 insertions(+), 3 deletions(-)
> 
> diff --git a/src/glsl/ir_set_program_inouts.cpp 
> b/src/glsl/ir_set_program_inouts.cpp
> index 97ead75..b38742c 100644
> --- a/src/glsl/ir_set_program_inouts.cpp
> +++ b/src/glsl/ir_set_program_inouts.cpp
> @@ -81,6 +81,16 @@ is_shader_inout(ir_variable *var)
>            var->data.mode == ir_var_system_value;
>  }
>  
> +static inline bool
> +is_dvec34_inout(ir_variable *var)
> +{
> +   const glsl_type *type = var->type->without_array();
> +   if (type == glsl_type::dvec4_type || type == glsl_type::dvec3_type)
> +      return true;
> +
> +   return false;

Why not just

   const glsl_type *const type = var->type->without_array();
   return type == glsl_type::dvec4_type || type == glsl_type::dvec3_type;

It may also be better to name this something different.  We'll do the
same "doubling" if / when we add support for GL_AMD_gpu_shader_int64.

> +}
> +
>  static void
>  mark(struct gl_program *prog, ir_variable *var, int offset, int len,
>       bool is_fragment_shader)
> @@ -94,19 +104,31 @@ mark(struct gl_program *prog, ir_variable *var, int 
> offset, int len,
>      */
>  
>     for (int i = 0; i < len; i++) {
> +      /* XXX Should it be i * 2 for dvec3/4? */
> +      int idx = var->data.location + var->data.index + offset + i;

I believe it should be i * 2.  Otherwise elements 0 and 1 of a dvec4
array will partially overlap.  That seems... bad.

>        GLbitfield64 bitfield =
> -         BITFIELD64_BIT(var->data.location + var->data.index + offset + i);
> +         BITFIELD64_BIT(idx);
> +
> +      /* dvec3 and dvec4 take up 2 slots */
> +      if (is_dvec34_inout(var))
> +         bitfield |= bitfield << 1;
>        if (var->data.mode == ir_var_shader_in) {
>        prog->InputsRead |= bitfield;
>           if (is_fragment_shader) {
>              gl_fragment_program *fprog = (gl_fragment_program *) prog;
> -            fprog->InterpQualifier[var->data.location +
> -                                   var->data.index + offset + i] =
> +            fprog->InterpQualifier[idx] =
>                 (glsl_interp_qualifier) var->data.interpolation;
>              if (var->data.centroid)
>                 fprog->IsCentroid |= bitfield;
>              if (var->data.sample)
>                 fprog->IsSample |= bitfield;
> +
> +            /* Set the InterpQualifier of the next slot to the same as the
> +             * current one, since dvec3 and dvec4 spans 2 slots.
> +             */
> +            if (is_dvec34_inout(var))
> +               fprog->InterpQualifier[idx + 1] =
> +                  (glsl_interp_qualifier) var->data.interpolation;
>           }
>        } else if (var->data.mode == ir_var_system_value) {
>           prog->SystemValuesRead |= bitfield;
> 

_______________________________________________
mesa-dev mailing list
mesa-dev@lists.freedesktop.org
http://lists.freedesktop.org/mailman/listinfo/mesa-dev

Reply via email to