---
 src/gallium/drivers/r600/evergreen_compute.c |   30 +++++++++++++------------
 1 files changed, 16 insertions(+), 14 deletions(-)

diff --git a/src/gallium/drivers/r600/evergreen_compute.c b/src/gallium/drivers/r600/evergreen_compute.c
index eaffb75..3ec9d9b 100644
--- a/src/gallium/drivers/r600/evergreen_compute.c
+++ b/src/gallium/drivers/r600/evergreen_compute.c
@@ -188,20 +188,6 @@ static void evergreen_bind_compute_state(struct pipe_context *ctx_, void *state)
 
        r600_inval_shader_cache(ctx);
 
-       /* We can't always determine the
-        * number of iterations in a loop before it's executed,
-        * so we just need to set up the loop counter to give us the maximum
-        * number of iterations possible.  Currently, loops in shader code
-        * ignore the loop counter and use a break instruction to exit the
-        * loop at the correct time.
-        */
-       evergreen_set_loop_const(ctx->cs_shader,
-               0, /* index */
-               0xFFF, /* Maximum value of the loop counter (i.e. when the loop
-                       * counter reaches this value, the program will break
-                       * out of the loop. */
-               0x0,   /* Starting value of the loop counter. */
-               0x1);  /* Amount to increment the loop counter each iteration. */
 }
 
 /* The kernel parameters are stored a vtx buffer (ID=0), besides the explicit
@@ -674,6 +660,22 @@ void evergreen_init_atom_start_compute_cs(struct r600_context *ctx)
                                                | S_0286E8_TGID_ENA
                                                | S_0286E8_DISABLE_INDEX_PACK)
                                                ;
+
+       /* The LOOP_CONST registers are an optimization for loops that allows
+        * you to store the initial counter, increment value, and maximum
+        * counter value in a register so that hardware can calculate the
+        * correct number of iterations for the loop, so that you don't need
+        * to have the loop counter in your shader code.  We don't currently use
+        * this optimization, so we must keep track of the counter in the
+        * shader and use a break instruction to exit loops.  However, the
+        * hardware will still use this register to determine when to exit a
+        * loop, so we need to initialize the counter to 0, set the increment
+        * value to 1 and the maximum counter value to 4095 (0xfff), which
+        * is the maximum value allowed.  This gives us a maximum of 4096
+        * iterations for our loops, but hopefully our break instruction will
+        * execute some time before the 4096th iteration.
+        */
+       eg_store_loop_const(cb, R_03A200_SQ_LOOP_CONST_0 + (160 * 4), 
0x1000FFF);
 }
 
 void evergreen_init_compute_state_functions(struct r600_context *ctx)
-- 
1.7.7.6

_______________________________________________
mesa-dev mailing list
mesa-dev@lists.freedesktop.org
http://lists.freedesktop.org/mailman/listinfo/mesa-dev

Reply via email to