http://gcc.gnu.org/bugzilla/show_bug.cgi?id=55360



             Bug #: 55360

           Summary: [TileGX] Passing structure by value on stack

                    needlessly writes to and reads from memory

    Classification: Unclassified

           Product: gcc

           Version: 4.7.2

            Status: UNCONFIRMED

          Severity: enhancement

          Priority: P3

         Component: rtl-optimization

        AssignedTo: unassig...@gcc.gnu.org

        ReportedBy: colander...@gmail.com





#include <stdint.h>



struct bar { uint8_t a, b, c, d; };

struct bla { unsigned long a:8, b:8, c:8, d:8; };



uint64_t bar(struct bar);

uint64_t bla(struct bla);



uint64_t foo(uint8_t a, uint8_t b, uint8_t c, uint8_t d)

{ return bar((struct bar) { a, b, c, d }); }



uint64_t baz(uint8_t a, uint8_t b, uint8_t c, uint8_t d)

{ return bla((struct bla) { a, b, c, d }); }



When compiled with "gcc -Wall -std=gnu99 -O3 -S pbv.c", the code above produces:



    .file    "pbv.c"

    .text

    .align 8

.global foo

    .type    foo, @function

foo:

.LFB0:

    .cfi_startproc

    {

    st    sp, lr

    .cfi_offset 55, 0

    move    r29, sp

    addi    r28, sp, -16

    }

    addi    sp, sp, -24

    .cfi_def_cfa_offset 24

    {

    st    r28, r29

    addi    r11, sp, 21

    addi    r10, sp, 20

    }

    {

    st1    r11, r1

    addi    r11, sp, 22

    }

    {

    st1    r11, r2

    addi    r11, sp, 23

    }

    {

    st1    r10, r0

    movei    r0, 0

    }

    st1    r11, r3

    ld4u    r10, r10

    {

    bfins    r0, r10, 0, 0+32-1

    jal    bar

    }

    addi    r29, sp, 24

    ld    lr, r29

    {



    addi    sp, sp, 24

    .cfi_restore 54

    .cfi_restore 55

    .cfi_def_cfa_offset 0

    jrp    lr

    }

    .cfi_endproc

.LFE0:

    .size    foo, .-foo

    .align 8

.global baz

    .type    baz, @function

baz:

.LFB1:

    .cfi_startproc

    {

    movei    r10, 0

    st    sp, lr

    .cfi_offset 55, 0

    move    r29, sp

    }

    {

    bfins    r10, r0, 0, 7

    addi    r28, sp, -8

    }

    {

    bfins    r10, r1, 8, 8+8-1

    addi    sp, sp, -16

    }

    .cfi_def_cfa_offset 16

    {

    bfins    r10, r2, 16, 16+8-1

    st    r28, r29

    }

    bfins    r10, r3, 24, 24+8-1

    {

    move    r0, r10

    jal    bla

    }

    addi    r29, sp, 16

    ld    lr, r29

    {



    addi    sp, sp, 16

    .cfi_restore 54

    .cfi_restore 55

    .cfi_def_cfa_offset 0

    jrp    lr

    }

    .cfi_endproc

.LFE1:

    .size    baz, .-baz

    .ident    "GCC: (GNU) 4.7.2"

    .section    .note.GNU-stack,"",@progbits



My expectation is that foo and baz should compile identically, and that both

should use the bfins (bit-field insert) instruction as baz does, rather than the

redundant stores to and loads from the stack that foo performs.



This is with a vanilla GCC 4.7.2 build on a TILEmpower system (roughly CentOS

5.7).



The problem does not occur on Debian x86-64 with either GCC 4.4.6 or GCC 4.7.2.



Possibly related to http://gcc.gnu.org/bugzilla/show_bug.cgi?id=7061 (however

that case seems to be fixed in 4.7.2).

Reply via email to