[Mesa-dev] [PATCH 02/37] i965/gen6/gs: refactor gen6_gs_state

2014-08-14 Thread Iago Toral Quiroga
From: Samuel Iglesias Gonsalvez 

Currently, gen6 only uses geometry shaders for transform feedback so the state
we emit is not suitable to accomodate general purpose, user-provided geometry
shaders. This patch paves the way to add these support and the needed
3DSTATE_GS packet modifications for it.

Previous code that emitted state to implement transform feedback in gen6 goes
to upload_gs_state_adhoc_tf().

Signed-off-by: Samuel Iglesias Gonsalvez 
---
 src/mesa/drivers/dri/i965/gen6_gs_state.c | 105 ++
 1 file changed, 94 insertions(+), 11 deletions(-)

diff --git a/src/mesa/drivers/dri/i965/gen6_gs_state.c 
b/src/mesa/drivers/dri/i965/gen6_gs_state.c
index 9648fb7..e132959 100644
--- a/src/mesa/drivers/dri/i965/gen6_gs_state.c
+++ b/src/mesa/drivers/dri/i965/gen6_gs_state.c
@@ -31,7 +31,7 @@
 #include "intel_batchbuffer.h"
 
 static void
-upload_gs_state(struct brw_context *brw)
+upload_gs_state_for_tf(struct brw_context *brw)
 {
/* Disable all the constant buffers. */
BEGIN_BATCH(5);
@@ -49,11 +49,11 @@ upload_gs_state(struct brw_context *brw)
   OUT_BATCH(GEN6_GS_SPF_MODE | GEN6_GS_VECTOR_MASK_ENABLE);
   OUT_BATCH(0); /* no scratch space */
   OUT_BATCH((2 << GEN6_GS_DISPATCH_START_GRF_SHIFT) |
-   (brw->ff_gs.prog_data->urb_read_length << 
GEN6_GS_URB_READ_LENGTH_SHIFT));
+(brw->ff_gs.prog_data->urb_read_length << 
GEN6_GS_URB_READ_LENGTH_SHIFT));
   OUT_BATCH(((brw->max_gs_threads - 1) << GEN6_GS_MAX_THREADS_SHIFT) |
-   GEN6_GS_STATISTICS_ENABLE |
-   GEN6_GS_SO_STATISTICS_ENABLE |
-   GEN6_GS_RENDERING_ENABLE);
+GEN6_GS_STATISTICS_ENABLE |
+GEN6_GS_SO_STATISTICS_ENABLE |
+GEN6_GS_RENDERING_ENABLE);
   OUT_BATCH(GEN6_GS_SVBI_PAYLOAD_ENABLE |
 GEN6_GS_SVBI_POSTINCREMENT_ENABLE |
 (brw->ff_gs.prog_data->svbi_postincrement_value <<
@@ -65,24 +65,107 @@ upload_gs_state(struct brw_context *brw)
   OUT_BATCH(_3DSTATE_GS << 16 | (7 - 2));
   OUT_BATCH(0); /* prog_bo */
   OUT_BATCH((0 << GEN6_GS_SAMPLER_COUNT_SHIFT) |
-   (0 << GEN6_GS_BINDING_TABLE_ENTRY_COUNT_SHIFT));
+(0 << GEN6_GS_BINDING_TABLE_ENTRY_COUNT_SHIFT));
   OUT_BATCH(0); /* scratch space base offset */
   OUT_BATCH((1 << GEN6_GS_DISPATCH_START_GRF_SHIFT) |
-   (0 << GEN6_GS_URB_READ_LENGTH_SHIFT) |
-   (0 << GEN6_GS_URB_ENTRY_READ_OFFSET_SHIFT));
+(0 << GEN6_GS_URB_READ_LENGTH_SHIFT) |
+(0 << GEN6_GS_URB_ENTRY_READ_OFFSET_SHIFT));
   OUT_BATCH((0 << GEN6_GS_MAX_THREADS_SHIFT) |
-   GEN6_GS_STATISTICS_ENABLE |
-   GEN6_GS_RENDERING_ENABLE);
+GEN6_GS_STATISTICS_ENABLE |
+GEN6_GS_RENDERING_ENABLE);
+  OUT_BATCH(0);
+  ADVANCE_BATCH();
+   }
+}
+
+static void
+upload_gs_state(struct brw_context *brw)
+{
+   /* BRW_NEW_GEOMETRY_PROGRAM */
+   bool active = brw->geometry_program;
+   /* CACHE_NEW_GS_PROG */
+   const struct brw_vec4_prog_data *prog_data = &brw->gs.prog_data->base;
+   const struct brw_stage_state *stage_state = &brw->gs.base;
+
+   if (active) {
+  /* FIXME: enable constant buffers */
+  BEGIN_BATCH(5);
+  OUT_BATCH(_3DSTATE_CONSTANT_GS << 16 | (5 - 2));
+  OUT_BATCH(0);
+  OUT_BATCH(0);
   OUT_BATCH(0);
+  OUT_BATCH(0);
+  ADVANCE_BATCH();
+
+  BEGIN_BATCH(7);
+  OUT_BATCH(_3DSTATE_GS << 16 | (7 - 2));
+  OUT_BATCH(stage_state->prog_offset);
+
+  /* GEN6_GS_SPF_MODE and GEN6_GS_VECTOR_MASK_ENABLE are enabled as it
+   * was previously done for gen6.
+   *
+   * TODO: test with both disabled to see if the HW is behaving
+   * as expected, like in gen7.
+   */
+  OUT_BATCH(GEN6_GS_SPF_MODE | GEN6_GS_VECTOR_MASK_ENABLE |
+((ALIGN(stage_state->sampler_count, 4)/4) <<
+ GEN6_GS_SAMPLER_COUNT_SHIFT) |
+((prog_data->base.binding_table.size_bytes / 4) <<
+ GEN6_GS_BINDING_TABLE_ENTRY_COUNT_SHIFT));
+
+  if (prog_data->total_scratch) {
+ OUT_RELOC(stage_state->scratch_bo,
+   I915_GEM_DOMAIN_RENDER, I915_GEM_DOMAIN_RENDER,
+   ffs(prog_data->total_scratch) - 11);
+  } else {
+ OUT_BATCH(0); /* no scratch space */
+  }
+
+  OUT_BATCH((prog_data->urb_read_length <<
+ GEN6_GS_URB_READ_LENGTH_SHIFT) |
+(0 << GEN6_GS_URB_ENTRY_READ_OFFSET_SHIFT) |
+(prog_data->base.dispatch_grf_start_reg <<
+ GEN6_GS_DISPATCH_START_GRF_SHIFT));
+
+  OUT_BATCH(((brw->max_gs_threads - 1) << GEN6_GS_MAX_THREADS_SHIFT) |
+GEN6_GS_STATISTICS_ENABLE |
+GEN6_GS_SO_STATISTICS_ENABLE |
+GEN6_GS_RENDERING_ENABLE);
+
+  /* FIXME: Enable SVBI payload only when TF is enable in SNB for
+  

Re: [Mesa-dev] [PATCH 02/37] i965/gen6/gs: refactor gen6_gs_state

2014-09-03 Thread Jordan Justen
Rather than:
i965/gen6/gs: refactor gen6_gs_state

How about something like:
i965/gen6/gs: Skeleton for user GS program support

(more below)

On Thu, Aug 14, 2014 at 4:11 AM, Iago Toral Quiroga  wrote:
> From: Samuel Iglesias Gonsalvez 
>
> Currently, gen6 only uses geometry shaders for transform feedback so the state
> we emit is not suitable to accomodate general purpose, user-provided geometry
> shaders. This patch paves the way to add these support and the needed
> 3DSTATE_GS packet modifications for it.
>
> Previous code that emitted state to implement transform feedback in gen6 goes
> to upload_gs_state_adhoc_tf().
>
> Signed-off-by: Samuel Iglesias Gonsalvez 
> ---
>  src/mesa/drivers/dri/i965/gen6_gs_state.c | 105 
> ++
>  1 file changed, 94 insertions(+), 11 deletions(-)
>
> diff --git a/src/mesa/drivers/dri/i965/gen6_gs_state.c 
> b/src/mesa/drivers/dri/i965/gen6_gs_state.c
> index 9648fb7..e132959 100644
> --- a/src/mesa/drivers/dri/i965/gen6_gs_state.c
> +++ b/src/mesa/drivers/dri/i965/gen6_gs_state.c
> @@ -31,7 +31,7 @@
>  #include "intel_batchbuffer.h"
>
>  static void
> -upload_gs_state(struct brw_context *brw)
> +upload_gs_state_for_tf(struct brw_context *brw)
>  {
> /* Disable all the constant buffers. */
> BEGIN_BATCH(5);
> @@ -49,11 +49,11 @@ upload_gs_state(struct brw_context *brw)
>OUT_BATCH(GEN6_GS_SPF_MODE | GEN6_GS_VECTOR_MASK_ENABLE);
>OUT_BATCH(0); /* no scratch space */
>OUT_BATCH((2 << GEN6_GS_DISPATCH_START_GRF_SHIFT) |
> -   (brw->ff_gs.prog_data->urb_read_length << 
> GEN6_GS_URB_READ_LENGTH_SHIFT));
> +(brw->ff_gs.prog_data->urb_read_length << 
> GEN6_GS_URB_READ_LENGTH_SHIFT));
>OUT_BATCH(((brw->max_gs_threads - 1) << GEN6_GS_MAX_THREADS_SHIFT) |
> -   GEN6_GS_STATISTICS_ENABLE |
> -   GEN6_GS_SO_STATISTICS_ENABLE |
> -   GEN6_GS_RENDERING_ENABLE);
> +GEN6_GS_STATISTICS_ENABLE |
> +GEN6_GS_SO_STATISTICS_ENABLE |
> +GEN6_GS_RENDERING_ENABLE);

This looks like tabs to spaces conversion. For lines that need to be
changed, it is good to do that conversion. But, in this case, the only
change is the name of the function.

>OUT_BATCH(GEN6_GS_SVBI_PAYLOAD_ENABLE |
>  GEN6_GS_SVBI_POSTINCREMENT_ENABLE |
>  (brw->ff_gs.prog_data->svbi_postincrement_value <<
> @@ -65,24 +65,107 @@ upload_gs_state(struct brw_context *brw)
>OUT_BATCH(_3DSTATE_GS << 16 | (7 - 2));
>OUT_BATCH(0); /* prog_bo */
>OUT_BATCH((0 << GEN6_GS_SAMPLER_COUNT_SHIFT) |
> -   (0 << GEN6_GS_BINDING_TABLE_ENTRY_COUNT_SHIFT));
> +(0 << GEN6_GS_BINDING_TABLE_ENTRY_COUNT_SHIFT));
>OUT_BATCH(0); /* scratch space base offset */
>OUT_BATCH((1 << GEN6_GS_DISPATCH_START_GRF_SHIFT) |
> -   (0 << GEN6_GS_URB_READ_LENGTH_SHIFT) |
> -   (0 << GEN6_GS_URB_ENTRY_READ_OFFSET_SHIFT));
> +(0 << GEN6_GS_URB_READ_LENGTH_SHIFT) |
> +(0 << GEN6_GS_URB_ENTRY_READ_OFFSET_SHIFT));
>OUT_BATCH((0 << GEN6_GS_MAX_THREADS_SHIFT) |
> -   GEN6_GS_STATISTICS_ENABLE |
> -   GEN6_GS_RENDERING_ENABLE);
> +GEN6_GS_STATISTICS_ENABLE |
> +GEN6_GS_RENDERING_ENABLE);
> +  OUT_BATCH(0);
> +  ADVANCE_BATCH();
> +   }
> +}
> +
> +static void
> +upload_gs_state(struct brw_context *brw)
> +{
> +   /* BRW_NEW_GEOMETRY_PROGRAM */
> +   bool active = brw->geometry_program;
> +   /* CACHE_NEW_GS_PROG */
> +   const struct brw_vec4_prog_data *prog_data = &brw->gs.prog_data->base;
> +   const struct brw_stage_state *stage_state = &brw->gs.base;
> +
> +   if (active) {
> +  /* FIXME: enable constant buffers */
> +  BEGIN_BATCH(5);
> +  OUT_BATCH(_3DSTATE_CONSTANT_GS << 16 | (5 - 2));
> +  OUT_BATCH(0);
> +  OUT_BATCH(0);
>OUT_BATCH(0);
> +  OUT_BATCH(0);
> +  ADVANCE_BATCH();
> +
> +  BEGIN_BATCH(7);
> +  OUT_BATCH(_3DSTATE_GS << 16 | (7 - 2));
> +  OUT_BATCH(stage_state->prog_offset);
> +
> +  /* GEN6_GS_SPF_MODE and GEN6_GS_VECTOR_MASK_ENABLE are enabled as it
> +   * was previously done for gen6.
> +   *
> +   * TODO: test with both disabled to see if the HW is behaving
> +   * as expected, like in gen7.
> +   */
> +  OUT_BATCH(GEN6_GS_SPF_MODE | GEN6_GS_VECTOR_MASK_ENABLE |
> +((ALIGN(stage_state->sampler_count, 4)/4) <<
> + GEN6_GS_SAMPLER_COUNT_SHIFT) |
> +((prog_data->base.binding_table.size_bytes / 4) <<
> + GEN6_GS_BINDING_TABLE_ENTRY_COUNT_SHIFT));
> +
> +  if (prog_data->total_scratch) {
> + OUT_RELOC(stage_state->scratch_bo,
> +   I915_GEM_DOMAIN_RENDER, I915_GEM_DOMAIN_RENDER,
> +   ffs(prog_data->total_scratch) - 11);
> +  } else {
> + OUT_BATCH(0); /* no 

Re: [Mesa-dev] [PATCH 02/37] i965/gen6/gs: refactor gen6_gs_state

2014-09-03 Thread Iago Toral Quiroga
On mié, 2014-09-03 at 18:51 -0700, Jordan Justen wrote:
> Rather than:
> i965/gen6/gs: refactor gen6_gs_state
> 
> How about something like:
> i965/gen6/gs: Skeleton for user GS program support

Sure, that sounds good to me.

> (more below)
> 
> On Thu, Aug 14, 2014 at 4:11 AM, Iago Toral Quiroga  wrote:
> > From: Samuel Iglesias Gonsalvez 
> >
> > Currently, gen6 only uses geometry shaders for transform feedback so the 
> > state
> > we emit is not suitable to accomodate general purpose, user-provided 
> > geometry
> > shaders. This patch paves the way to add these support and the needed
> > 3DSTATE_GS packet modifications for it.
> >
> > Previous code that emitted state to implement transform feedback in gen6 
> > goes
> > to upload_gs_state_adhoc_tf().
> >
> > Signed-off-by: Samuel Iglesias Gonsalvez 
> > ---
> >  src/mesa/drivers/dri/i965/gen6_gs_state.c | 105 
> > ++
> >  1 file changed, 94 insertions(+), 11 deletions(-)
> >
> > diff --git a/src/mesa/drivers/dri/i965/gen6_gs_state.c 
> > b/src/mesa/drivers/dri/i965/gen6_gs_state.c
> > index 9648fb7..e132959 100644
> > --- a/src/mesa/drivers/dri/i965/gen6_gs_state.c
> > +++ b/src/mesa/drivers/dri/i965/gen6_gs_state.c
> > @@ -31,7 +31,7 @@
> >  #include "intel_batchbuffer.h"
> >
> >  static void
> > -upload_gs_state(struct brw_context *brw)
> > +upload_gs_state_for_tf(struct brw_context *brw)
> >  {
> > /* Disable all the constant buffers. */
> > BEGIN_BATCH(5);
> > @@ -49,11 +49,11 @@ upload_gs_state(struct brw_context *brw)
> >OUT_BATCH(GEN6_GS_SPF_MODE | GEN6_GS_VECTOR_MASK_ENABLE);
> >OUT_BATCH(0); /* no scratch space */
> >OUT_BATCH((2 << GEN6_GS_DISPATCH_START_GRF_SHIFT) |
> > -   (brw->ff_gs.prog_data->urb_read_length << 
> > GEN6_GS_URB_READ_LENGTH_SHIFT));
> > +(brw->ff_gs.prog_data->urb_read_length << 
> > GEN6_GS_URB_READ_LENGTH_SHIFT));
> >OUT_BATCH(((brw->max_gs_threads - 1) << GEN6_GS_MAX_THREADS_SHIFT) |
> > -   GEN6_GS_STATISTICS_ENABLE |
> > -   GEN6_GS_SO_STATISTICS_ENABLE |
> > -   GEN6_GS_RENDERING_ENABLE);
> > +GEN6_GS_STATISTICS_ENABLE |
> > +GEN6_GS_SO_STATISTICS_ENABLE |
> > +GEN6_GS_RENDERING_ENABLE);
> 
> This looks like tabs to spaces conversion. For lines that need to be
> changed, it is good to do that conversion. But, in this case, the only
> change is the name of the function.

Okay.

You granted the reviewed-by anyway though, so I understand that this
comment is only for reference. Or would you prefer that we remove these
changes from the patch?

> >OUT_BATCH(GEN6_GS_SVBI_PAYLOAD_ENABLE |
> >  GEN6_GS_SVBI_POSTINCREMENT_ENABLE |
> >  (brw->ff_gs.prog_data->svbi_postincrement_value <<
> > @@ -65,24 +65,107 @@ upload_gs_state(struct brw_context *brw)
> >OUT_BATCH(_3DSTATE_GS << 16 | (7 - 2));
> >OUT_BATCH(0); /* prog_bo */
> >OUT_BATCH((0 << GEN6_GS_SAMPLER_COUNT_SHIFT) |
> > -   (0 << GEN6_GS_BINDING_TABLE_ENTRY_COUNT_SHIFT));
> > +(0 << GEN6_GS_BINDING_TABLE_ENTRY_COUNT_SHIFT));
> >OUT_BATCH(0); /* scratch space base offset */
> >OUT_BATCH((1 << GEN6_GS_DISPATCH_START_GRF_SHIFT) |
> > -   (0 << GEN6_GS_URB_READ_LENGTH_SHIFT) |
> > -   (0 << GEN6_GS_URB_ENTRY_READ_OFFSET_SHIFT));
> > +(0 << GEN6_GS_URB_READ_LENGTH_SHIFT) |
> > +(0 << GEN6_GS_URB_ENTRY_READ_OFFSET_SHIFT));
> >OUT_BATCH((0 << GEN6_GS_MAX_THREADS_SHIFT) |
> > -   GEN6_GS_STATISTICS_ENABLE |
> > -   GEN6_GS_RENDERING_ENABLE);
> > +GEN6_GS_STATISTICS_ENABLE |
> > +GEN6_GS_RENDERING_ENABLE);
> > +  OUT_BATCH(0);
> > +  ADVANCE_BATCH();
> > +   }
> > +}
> > +
> > +static void
> > +upload_gs_state(struct brw_context *brw)
> > +{
> > +   /* BRW_NEW_GEOMETRY_PROGRAM */
> > +   bool active = brw->geometry_program;
> > +   /* CACHE_NEW_GS_PROG */
> > +   const struct brw_vec4_prog_data *prog_data = &brw->gs.prog_data->base;
> > +   const struct brw_stage_state *stage_state = &brw->gs.base;
> > +
> > +   if (active) {
> > +  /* FIXME: enable constant buffers */
> > +  BEGIN_BATCH(5);
> > +  OUT_BATCH(_3DSTATE_CONSTANT_GS << 16 | (5 - 2));
> > +  OUT_BATCH(0);
> > +  OUT_BATCH(0);
> >OUT_BATCH(0);
> > +  OUT_BATCH(0);
> > +  ADVANCE_BATCH();
> > +
> > +  BEGIN_BATCH(7);
> > +  OUT_BATCH(_3DSTATE_GS << 16 | (7 - 2));
> > +  OUT_BATCH(stage_state->prog_offset);
> > +
> > +  /* GEN6_GS_SPF_MODE and GEN6_GS_VECTOR_MASK_ENABLE are enabled as it
> > +   * was previously done for gen6.
> > +   *
> > +   * TODO: test with both disabled to see if the HW is behaving
> > +   * as expected, like in gen7.
> > +   */
> > +  OUT_BATCH(GEN6_GS_SPF_MODE | GEN6_GS_VECTOR_MASK_ENABLE |
> > +   

Re: [Mesa-dev] [PATCH 02/37] i965/gen6/gs: refactor gen6_gs_state

2014-09-04 Thread Jordan Justen
On Wed, Sep 3, 2014 at 11:33 PM, Iago Toral Quiroga  wrote:
> On mié, 2014-09-03 at 18:51 -0700, Jordan Justen wrote:
>> Rather than:
>> i965/gen6/gs: refactor gen6_gs_state
>>
>> How about something like:
>> i965/gen6/gs: Skeleton for user GS program support
>
> Sure, that sounds good to me.
>
>> (more below)
>>
>> On Thu, Aug 14, 2014 at 4:11 AM, Iago Toral Quiroga  
>> wrote:
>> > From: Samuel Iglesias Gonsalvez 
>> >
>> > Currently, gen6 only uses geometry shaders for transform feedback so the 
>> > state
>> > we emit is not suitable to accomodate general purpose, user-provided 
>> > geometry
>> > shaders. This patch paves the way to add these support and the needed
>> > 3DSTATE_GS packet modifications for it.
>> >
>> > Previous code that emitted state to implement transform feedback in gen6 
>> > goes
>> > to upload_gs_state_adhoc_tf().
>> >
>> > Signed-off-by: Samuel Iglesias Gonsalvez 
>> > ---
>> >  src/mesa/drivers/dri/i965/gen6_gs_state.c | 105 
>> > ++
>> >  1 file changed, 94 insertions(+), 11 deletions(-)
>> >
>> > diff --git a/src/mesa/drivers/dri/i965/gen6_gs_state.c 
>> > b/src/mesa/drivers/dri/i965/gen6_gs_state.c
>> > index 9648fb7..e132959 100644
>> > --- a/src/mesa/drivers/dri/i965/gen6_gs_state.c
>> > +++ b/src/mesa/drivers/dri/i965/gen6_gs_state.c
>> > @@ -31,7 +31,7 @@
>> >  #include "intel_batchbuffer.h"
>> >
>> >  static void
>> > -upload_gs_state(struct brw_context *brw)
>> > +upload_gs_state_for_tf(struct brw_context *brw)
>> >  {
>> > /* Disable all the constant buffers. */
>> > BEGIN_BATCH(5);
>> > @@ -49,11 +49,11 @@ upload_gs_state(struct brw_context *brw)
>> >OUT_BATCH(GEN6_GS_SPF_MODE | GEN6_GS_VECTOR_MASK_ENABLE);
>> >OUT_BATCH(0); /* no scratch space */
>> >OUT_BATCH((2 << GEN6_GS_DISPATCH_START_GRF_SHIFT) |
>> > -   (brw->ff_gs.prog_data->urb_read_length << 
>> > GEN6_GS_URB_READ_LENGTH_SHIFT));
>> > +(brw->ff_gs.prog_data->urb_read_length << 
>> > GEN6_GS_URB_READ_LENGTH_SHIFT));
>> >OUT_BATCH(((brw->max_gs_threads - 1) << GEN6_GS_MAX_THREADS_SHIFT) |
>> > -   GEN6_GS_STATISTICS_ENABLE |
>> > -   GEN6_GS_SO_STATISTICS_ENABLE |
>> > -   GEN6_GS_RENDERING_ENABLE);
>> > +GEN6_GS_STATISTICS_ENABLE |
>> > +GEN6_GS_SO_STATISTICS_ENABLE |
>> > +GEN6_GS_RENDERING_ENABLE);
>>
>> This looks like tabs to spaces conversion. For lines that need to be
>> changed, it is good to do that conversion. But, in this case, the only
>> change is the name of the function.
>
> Okay.
>
> You granted the reviewed-by anyway though, so I understand that this
> comment is only for reference. Or would you prefer that we remove these
> changes from the patch?

Could you clean it up? It makes review easier, both now, and in
looking back through the history. (also, git blame...)

Thanks,

-Jordan

>> >OUT_BATCH(GEN6_GS_SVBI_PAYLOAD_ENABLE |
>> >  GEN6_GS_SVBI_POSTINCREMENT_ENABLE |
>> >  (brw->ff_gs.prog_data->svbi_postincrement_value <<
>> > @@ -65,24 +65,107 @@ upload_gs_state(struct brw_context *brw)
>> >OUT_BATCH(_3DSTATE_GS << 16 | (7 - 2));
>> >OUT_BATCH(0); /* prog_bo */
>> >OUT_BATCH((0 << GEN6_GS_SAMPLER_COUNT_SHIFT) |
>> > -   (0 << GEN6_GS_BINDING_TABLE_ENTRY_COUNT_SHIFT));
>> > +(0 << GEN6_GS_BINDING_TABLE_ENTRY_COUNT_SHIFT));
>> >OUT_BATCH(0); /* scratch space base offset */
>> >OUT_BATCH((1 << GEN6_GS_DISPATCH_START_GRF_SHIFT) |
>> > -   (0 << GEN6_GS_URB_READ_LENGTH_SHIFT) |
>> > -   (0 << GEN6_GS_URB_ENTRY_READ_OFFSET_SHIFT));
>> > +(0 << GEN6_GS_URB_READ_LENGTH_SHIFT) |
>> > +(0 << GEN6_GS_URB_ENTRY_READ_OFFSET_SHIFT));
>> >OUT_BATCH((0 << GEN6_GS_MAX_THREADS_SHIFT) |
>> > -   GEN6_GS_STATISTICS_ENABLE |
>> > -   GEN6_GS_RENDERING_ENABLE);
>> > +GEN6_GS_STATISTICS_ENABLE |
>> > +GEN6_GS_RENDERING_ENABLE);
>> > +  OUT_BATCH(0);
>> > +  ADVANCE_BATCH();
>> > +   }
>> > +}
>> > +
>> > +static void
>> > +upload_gs_state(struct brw_context *brw)
>> > +{
>> > +   /* BRW_NEW_GEOMETRY_PROGRAM */
>> > +   bool active = brw->geometry_program;
>> > +   /* CACHE_NEW_GS_PROG */
>> > +   const struct brw_vec4_prog_data *prog_data = &brw->gs.prog_data->base;
>> > +   const struct brw_stage_state *stage_state = &brw->gs.base;
>> > +
>> > +   if (active) {
>> > +  /* FIXME: enable constant buffers */
>> > +  BEGIN_BATCH(5);
>> > +  OUT_BATCH(_3DSTATE_CONSTANT_GS << 16 | (5 - 2));
>> > +  OUT_BATCH(0);
>> > +  OUT_BATCH(0);
>> >OUT_BATCH(0);
>> > +  OUT_BATCH(0);
>> > +  ADVANCE_BATCH();
>> > +
>> > +  BEGIN_BATCH(7);
>> > +  OUT_BATCH(_3DSTATE_GS << 16 | (7 - 2));
>> > +  OUT_BATCH(stage_state->prog_offset);
>> > +
>> > +  /* GEN6_GS_SPF_MODE a

Re: [Mesa-dev] [PATCH 02/37] i965/gen6/gs: refactor gen6_gs_state

2014-09-04 Thread Iago Toral Quiroga
On jue, 2014-09-04 at 00:44 -0700, Jordan Justen wrote:
> On Wed, Sep 3, 2014 at 11:33 PM, Iago Toral Quiroga  wrote:
> > On mié, 2014-09-03 at 18:51 -0700, Jordan Justen wrote:
> >> Rather than:
> >> i965/gen6/gs: refactor gen6_gs_state
> >>
> >> How about something like:
> >> i965/gen6/gs: Skeleton for user GS program support
> >
> > Sure, that sounds good to me.
> >
> >> (more below)
> >>
> >> On Thu, Aug 14, 2014 at 4:11 AM, Iago Toral Quiroga  
> >> wrote:
> >> > From: Samuel Iglesias Gonsalvez 
> >> >
> >> > Currently, gen6 only uses geometry shaders for transform feedback so the 
> >> > state
> >> > we emit is not suitable to accomodate general purpose, user-provided 
> >> > geometry
> >> > shaders. This patch paves the way to add these support and the needed
> >> > 3DSTATE_GS packet modifications for it.
> >> >
> >> > Previous code that emitted state to implement transform feedback in gen6 
> >> > goes
> >> > to upload_gs_state_adhoc_tf().
> >> >
> >> > Signed-off-by: Samuel Iglesias Gonsalvez 
> >> > ---
> >> >  src/mesa/drivers/dri/i965/gen6_gs_state.c | 105 
> >> > ++
> >> >  1 file changed, 94 insertions(+), 11 deletions(-)
> >> >
> >> > diff --git a/src/mesa/drivers/dri/i965/gen6_gs_state.c 
> >> > b/src/mesa/drivers/dri/i965/gen6_gs_state.c
> >> > index 9648fb7..e132959 100644
> >> > --- a/src/mesa/drivers/dri/i965/gen6_gs_state.c
> >> > +++ b/src/mesa/drivers/dri/i965/gen6_gs_state.c
> >> > @@ -31,7 +31,7 @@
> >> >  #include "intel_batchbuffer.h"
> >> >
> >> >  static void
> >> > -upload_gs_state(struct brw_context *brw)
> >> > +upload_gs_state_for_tf(struct brw_context *brw)
> >> >  {
> >> > /* Disable all the constant buffers. */
> >> > BEGIN_BATCH(5);
> >> > @@ -49,11 +49,11 @@ upload_gs_state(struct brw_context *brw)
> >> >OUT_BATCH(GEN6_GS_SPF_MODE | GEN6_GS_VECTOR_MASK_ENABLE);
> >> >OUT_BATCH(0); /* no scratch space */
> >> >OUT_BATCH((2 << GEN6_GS_DISPATCH_START_GRF_SHIFT) |
> >> > -   (brw->ff_gs.prog_data->urb_read_length << 
> >> > GEN6_GS_URB_READ_LENGTH_SHIFT));
> >> > +(brw->ff_gs.prog_data->urb_read_length << 
> >> > GEN6_GS_URB_READ_LENGTH_SHIFT));
> >> >OUT_BATCH(((brw->max_gs_threads - 1) << 
> >> > GEN6_GS_MAX_THREADS_SHIFT) |
> >> > -   GEN6_GS_STATISTICS_ENABLE |
> >> > -   GEN6_GS_SO_STATISTICS_ENABLE |
> >> > -   GEN6_GS_RENDERING_ENABLE);
> >> > +GEN6_GS_STATISTICS_ENABLE |
> >> > +GEN6_GS_SO_STATISTICS_ENABLE |
> >> > +GEN6_GS_RENDERING_ENABLE);
> >>
> >> This looks like tabs to spaces conversion. For lines that need to be
> >> changed, it is good to do that conversion. But, in this case, the only
> >> change is the name of the function.
> >
> > Okay.
> >
> > You granted the reviewed-by anyway though, so I understand that this
> > comment is only for reference. Or would you prefer that we remove these
> > changes from the patch?
> 
> Could you clean it up? It makes review easier, both now, and in
> looking back through the history. (also, git blame...)
> 
> Thanks,

Sure, no problem.

Iago

> -Jordan
> 
> >> >OUT_BATCH(GEN6_GS_SVBI_PAYLOAD_ENABLE |
> >> >  GEN6_GS_SVBI_POSTINCREMENT_ENABLE |
> >> >  (brw->ff_gs.prog_data->svbi_postincrement_value <<
> >> > @@ -65,24 +65,107 @@ upload_gs_state(struct brw_context *brw)
> >> >OUT_BATCH(_3DSTATE_GS << 16 | (7 - 2));
> >> >OUT_BATCH(0); /* prog_bo */
> >> >OUT_BATCH((0 << GEN6_GS_SAMPLER_COUNT_SHIFT) |
> >> > -   (0 << GEN6_GS_BINDING_TABLE_ENTRY_COUNT_SHIFT));
> >> > +(0 << GEN6_GS_BINDING_TABLE_ENTRY_COUNT_SHIFT));
> >> >OUT_BATCH(0); /* scratch space base offset */
> >> >OUT_BATCH((1 << GEN6_GS_DISPATCH_START_GRF_SHIFT) |
> >> > -   (0 << GEN6_GS_URB_READ_LENGTH_SHIFT) |
> >> > -   (0 << GEN6_GS_URB_ENTRY_READ_OFFSET_SHIFT));
> >> > +(0 << GEN6_GS_URB_READ_LENGTH_SHIFT) |
> >> > +(0 << GEN6_GS_URB_ENTRY_READ_OFFSET_SHIFT));
> >> >OUT_BATCH((0 << GEN6_GS_MAX_THREADS_SHIFT) |
> >> > -   GEN6_GS_STATISTICS_ENABLE |
> >> > -   GEN6_GS_RENDERING_ENABLE);
> >> > +GEN6_GS_STATISTICS_ENABLE |
> >> > +GEN6_GS_RENDERING_ENABLE);
> >> > +  OUT_BATCH(0);
> >> > +  ADVANCE_BATCH();
> >> > +   }
> >> > +}
> >> > +
> >> > +static void
> >> > +upload_gs_state(struct brw_context *brw)
> >> > +{
> >> > +   /* BRW_NEW_GEOMETRY_PROGRAM */
> >> > +   bool active = brw->geometry_program;
> >> > +   /* CACHE_NEW_GS_PROG */
> >> > +   const struct brw_vec4_prog_data *prog_data = 
> >> > &brw->gs.prog_data->base;
> >> > +   const struct brw_stage_state *stage_state = &brw->gs.base;
> >> > +
> >> > +   if (active) {
> >> > +  /* FIXME: enable constant buffers */
> >> > +  BEGIN_BATCH(5);
> >> > +  OUT_BATCH(_3DSTATE_CONSTANT

Re: [Mesa-dev] [PATCH 02/37] i965/gen6/gs: refactor gen6_gs_state

2014-09-04 Thread Iago Toral Quiroga
On mié, 2014-09-03 at 18:51 -0700, Jordan Justen wrote:
> Rather than:
> i965/gen6/gs: refactor gen6_gs_state
> 
> How about something like:
> i965/gen6/gs: Skeleton for user GS program support
> 
> (more below)
> 
> On Thu, Aug 14, 2014 at 4:11 AM, Iago Toral Quiroga  wrote:
> > From: Samuel Iglesias Gonsalvez 
> >
> > Currently, gen6 only uses geometry shaders for transform feedback so the 
> > state
> > we emit is not suitable to accomodate general purpose, user-provided 
> > geometry
> > shaders. This patch paves the way to add these support and the needed
> > 3DSTATE_GS packet modifications for it.
> >
> > Previous code that emitted state to implement transform feedback in gen6 
> > goes
> > to upload_gs_state_adhoc_tf().
> >
> > Signed-off-by: Samuel Iglesias Gonsalvez 
> > ---
> >  src/mesa/drivers/dri/i965/gen6_gs_state.c | 105 
> > ++
> >  1 file changed, 94 insertions(+), 11 deletions(-)
> >
> > diff --git a/src/mesa/drivers/dri/i965/gen6_gs_state.c 
> > b/src/mesa/drivers/dri/i965/gen6_gs_state.c
> > index 9648fb7..e132959 100644
> > --- a/src/mesa/drivers/dri/i965/gen6_gs_state.c
> > +++ b/src/mesa/drivers/dri/i965/gen6_gs_state.c
> > @@ -31,7 +31,7 @@
> >  #include "intel_batchbuffer.h"
> >
> >  static void
> > -upload_gs_state(struct brw_context *brw)
> > +upload_gs_state_for_tf(struct brw_context *brw)
> >  {
> > /* Disable all the constant buffers. */
> > BEGIN_BATCH(5);
> > @@ -49,11 +49,11 @@ upload_gs_state(struct brw_context *brw)
> >OUT_BATCH(GEN6_GS_SPF_MODE | GEN6_GS_VECTOR_MASK_ENABLE);
> >OUT_BATCH(0); /* no scratch space */
> >OUT_BATCH((2 << GEN6_GS_DISPATCH_START_GRF_SHIFT) |
> > -   (brw->ff_gs.prog_data->urb_read_length << 
> > GEN6_GS_URB_READ_LENGTH_SHIFT));
> > +(brw->ff_gs.prog_data->urb_read_length << 
> > GEN6_GS_URB_READ_LENGTH_SHIFT));
> >OUT_BATCH(((brw->max_gs_threads - 1) << GEN6_GS_MAX_THREADS_SHIFT) |
> > -   GEN6_GS_STATISTICS_ENABLE |
> > -   GEN6_GS_SO_STATISTICS_ENABLE |
> > -   GEN6_GS_RENDERING_ENABLE);
> > +GEN6_GS_STATISTICS_ENABLE |
> > +GEN6_GS_SO_STATISTICS_ENABLE |
> > +GEN6_GS_RENDERING_ENABLE);
> 
> This looks like tabs to spaces conversion. For lines that need to be
> changed, it is good to do that conversion. But, in this case, the only
> change is the name of the function.
> 
> >OUT_BATCH(GEN6_GS_SVBI_PAYLOAD_ENABLE |
> >  GEN6_GS_SVBI_POSTINCREMENT_ENABLE |
> >  (brw->ff_gs.prog_data->svbi_postincrement_value <<
> > @@ -65,24 +65,107 @@ upload_gs_state(struct brw_context *brw)
> >OUT_BATCH(_3DSTATE_GS << 16 | (7 - 2));
> >OUT_BATCH(0); /* prog_bo */
> >OUT_BATCH((0 << GEN6_GS_SAMPLER_COUNT_SHIFT) |
> > -   (0 << GEN6_GS_BINDING_TABLE_ENTRY_COUNT_SHIFT));
> > +(0 << GEN6_GS_BINDING_TABLE_ENTRY_COUNT_SHIFT));
> >OUT_BATCH(0); /* scratch space base offset */
> >OUT_BATCH((1 << GEN6_GS_DISPATCH_START_GRF_SHIFT) |
> > -   (0 << GEN6_GS_URB_READ_LENGTH_SHIFT) |
> > -   (0 << GEN6_GS_URB_ENTRY_READ_OFFSET_SHIFT));
> > +(0 << GEN6_GS_URB_READ_LENGTH_SHIFT) |
> > +(0 << GEN6_GS_URB_ENTRY_READ_OFFSET_SHIFT));
> >OUT_BATCH((0 << GEN6_GS_MAX_THREADS_SHIFT) |
> > -   GEN6_GS_STATISTICS_ENABLE |
> > -   GEN6_GS_RENDERING_ENABLE);
> > +GEN6_GS_STATISTICS_ENABLE |
> > +GEN6_GS_RENDERING_ENABLE);
> > +  OUT_BATCH(0);
> > +  ADVANCE_BATCH();
> > +   }
> > +}
> > +
> > +static void
> > +upload_gs_state(struct brw_context *brw)
> > +{
> > +   /* BRW_NEW_GEOMETRY_PROGRAM */
> > +   bool active = brw->geometry_program;
> > +   /* CACHE_NEW_GS_PROG */
> > +   const struct brw_vec4_prog_data *prog_data = &brw->gs.prog_data->base;
> > +   const struct brw_stage_state *stage_state = &brw->gs.base;
> > +
> > +   if (active) {
> > +  /* FIXME: enable constant buffers */
> > +  BEGIN_BATCH(5);
> > +  OUT_BATCH(_3DSTATE_CONSTANT_GS << 16 | (5 - 2));
> > +  OUT_BATCH(0);
> > +  OUT_BATCH(0);
> >OUT_BATCH(0);
> > +  OUT_BATCH(0);
> > +  ADVANCE_BATCH();
> > +
> > +  BEGIN_BATCH(7);
> > +  OUT_BATCH(_3DSTATE_GS << 16 | (7 - 2));
> > +  OUT_BATCH(stage_state->prog_offset);
> > +
> > +  /* GEN6_GS_SPF_MODE and GEN6_GS_VECTOR_MASK_ENABLE are enabled as it
> > +   * was previously done for gen6.
> > +   *
> > +   * TODO: test with both disabled to see if the HW is behaving
> > +   * as expected, like in gen7.
> > +   */
> > +  OUT_BATCH(GEN6_GS_SPF_MODE | GEN6_GS_VECTOR_MASK_ENABLE |
> > +((ALIGN(stage_state->sampler_count, 4)/4) <<
> > + GEN6_GS_SAMPLER_COUNT_SHIFT) |
> > +((prog_data->base.binding_table.size_bytes / 4) <<
> > + GEN6_GS