https://gcc.gnu.org/bugzilla/show_bug.cgi?id=79425
Bug ID: 79425
Summary: Inline assembly getting clobbered in some case
Product: gcc
Version: 5.4.0
Status: UNCONFIRMED
Severity: normal
Priority: P3
Component: c++
Assignee: unassigned at gcc dot gnu.org
Reporter: mini at cs dot technion.ac.il
Target Milestone: ---
I am getting inline assembly code clobbered if I #include<algorithm>, it is the
1st code in the .text segment, AND I use -std=c++11
This is the INCORRECT behavior. As you can see, the label reg_in is gone:
$ gcc -v
Using built-in specs.
COLLECT_GCC=gcc
COLLECT_LTO_WRAPPER=/usr/lib/gcc/x86_64-linux-gnu/5/lto-wrapper
Target: x86_64-linux-gnu
Configured with: ../src/configure -v --with-pkgversion='Ubuntu
5.4.0-6ubuntu1~16.04.4' --with-bugurl=file:///usr/share/doc/gcc-5/README.Bugs
--enable-languages=c,ada,c++,java,go,d,fortran,objc,obj-c++ --prefix=/usr
--program-suffix=-5 --enable-shared --enable-linker-build-id
--libexecdir=/usr/lib --without-included-gettext --enable-threads=posix
--libdir=/usr/lib --enable-nls --with-sysroot=/ --enable-clocale=gnu
--enable-libstdcxx-debug --enable-libstdcxx-time=yes
--with-default-libstdcxx-abi=new --enable-gnu-unique-object
--disable-vtable-verify --enable-libmpx --enable-plugin --with-system-zlib
--disable-browser-plugin --enable-java-awt=gtk --enable-gtk-cairo
--with-java-home=/usr/lib/jvm/java-1.5.0-gcj-5-amd64/jre --enable-java-home
--with-jvm-root-dir=/usr/lib/jvm/java-1.5.0-gcj-5-amd64
--with-jvm-jar-dir=/usr/lib/jvm-exports/java-1.5.0-gcj-5-amd64
--with-arch-directory=amd64 --with-ecj-jar=/usr/share/java/eclipse-ecj.jar
--enable-objc-gc --enable-multiarch --disable-werror --with-arch-32=i686
--with-abi=m64 --with-multilib-list=m32,m64,mx32 --enable-multilib
--with-tune=generic --enable-checking=release --build=x86_64-linux-gnu
--host=x86_64-linux-gnu --target=x86_64-linux-gnu
Thread model: posix
gcc version 5.4.0 20160609 (Ubuntu 5.4.0-6ubuntu1~16.04.4)
$ cat prog.c
#include <algorithm>
//void foo(){}
__asm__ volatile ("reg_in: \n\t"
"pushf\n\t"
"push %rbp\n\t"
"mov %rsp,%rbp\n\t"
"push %rdi\n\t"
"push %rsi\n\t"
"push %rdx\n\t"
"push %rcx\n\t"
"push %r8 \n\t"
"push %r9 \n\t"
"push %rax\n\t"
);
int main(int argc, char *argv[])
{
}
$ g++ -std=c++11 prog.c
$ objdump -d a.out # I put here only partial output
00000000004004b0 <frame_dummy>:
4004b0: bf 20 0e 60 00 mov $0x600e20,%edi
4004b5: 48 83 3f 00 cmpq $0x0,(%rdi)
4004b9: 75 05 jne 4004c0 <frame_dummy+0x10>
4004bb: eb 93 jmp 400450 <register_tm_clones>
4004bd: 0f 1f 00 nopl (%rax)
4004c0: b8 00 00 00 00 mov $0x0,%eax
4004c5: 48 85 c0 test %rax,%rax
4004c8: 74 f1 je 4004bb <frame_dummy+0xb>
4004ca: 55 push %rbp
4004cb: 48 89 e5 mov %rsp,%rbp
4004ce: ff d0 callq *%rax
4004d0: 5d pop %rbp
4004d1: e9 7a ff ff ff jmpq 400450 <register_tm_clones>
00000000004004d6 <main>:
4004d6: 55 push %rbp
4004d7: 48 89 e5 mov %rsp,%rbp
4004da: 89 7d fc mov %edi,-0x4(%rbp)
4004dd: 48 89 75 f0 mov %rsi,-0x10(%rbp)
4004e1: b8 00 00 00 00 mov $0x0,%eax
4004e6: 5d pop %rbp
4004e7: c3 retq
4004e8: 0f 1f 84 00 00 00 00 nopl 0x0(%rax,%rax,1)
4004ef: 00
If I do 1 of the following, I get the correct result
1. uncomment void foo(){}
2. remove #include <algorithm>
The examples below, are of CORRECT behaviors. Here the label reg_in stays:
$ vi prog.c
$ g++ -std=c++11 prog.c
$ cat prog.c
#include <algorithm>
void foo(){}
__asm__ volatile ("reg_in: \n\t"
"pushf\n\t"
"push %rbp\n\t"
"mov %rsp,%rbp\n\t"
"push %rdi\n\t"
"push %rsi\n\t"
"push %rdx\n\t"
"push %rcx\n\t"
"push %r8 \n\t"
"push %r9 \n\t"
"push %rax\n\t"
);
int main(int argc, char *argv[])
{
}
$ objdump -d a.out # I put here only partial output
00000000004004b0 <frame_dummy>:
4004b0: bf 20 0e 60 00 mov $0x600e20,%edi
4004b5: 48 83 3f 00 cmpq $0x0,(%rdi)
4004b9: 75 05 jne 4004c0 <frame_dummy+0x10>
4004bb: eb 93 jmp 400450 <register_tm_clones>
4004bd: 0f 1f 00 nopl (%rax)
4004c0: b8 00 00 00 00 mov $0x0,%eax
4004c5: 48 85 c0 test %rax,%rax
4004c8: 74 f1 je 4004bb <frame_dummy+0xb>
4004ca: 55 push %rbp
4004cb: 48 89 e5 mov %rsp,%rbp
4004ce: ff d0 callq *%rax
4004d0: 5d pop %rbp
4004d1: e9 7a ff ff ff jmpq 400450 <register_tm_clones>
00000000004004d6 <_Z3foov>:
4004d6: 55 push %rbp
4004d7: 48 89 e5 mov %rsp,%rbp
4004da: 90 nop
4004db: 5d pop %rbp
4004dc: c3 retq
00000000004004dd <reg_in>:
4004dd: 9c pushfq
4004de: 55 push %rbp
4004df: 48 89 e5 mov %rsp,%rbp
4004e2: 57 push %rdi
4004e3: 56 push %rsi
4004e4: 52 push %rdx
4004e5: 51 push %rcx
4004e6: 41 50 push %r8
4004e8: 41 51 push %r9
4004ea: 50 push %rax
00000000004004eb <main>:
4004eb: 55 push %rbp
4004ec: 48 89 e5 mov %rsp,%rbp
4004ef: 89 7d fc mov %edi,-0x4(%rbp)
4004f2: 48 89 75 f0 mov %rsi,-0x10(%rbp)
4004f6: b8 00 00 00 00 mov $0x0,%eax
4004fb: 5d pop %rbp
4004fc: c3 retq
4004fd: 0f 1f 00 nopl (%rax)
$ vi prog.c
$ g++ -std=c++11 prog.c
$ cat prog.c
//#include <algorithm>
//void foo(){}
__asm__ volatile ("reg_in: \n\t"
"pushf\n\t"
"push %rbp\n\t"
"mov %rsp,%rbp\n\t"
"push %rdi\n\t"
"push %rsi\n\t"
"push %rdx\n\t"
"push %rcx\n\t"
"push %r8 \n\t"
"push %r9 \n\t"
"push %rax\n\t"
);
int main(int argc, char *argv[])
{
}
$ objdump -d a.out # I put here only partial output
00000000004004b0 <frame_dummy>:
4004b0: bf 20 0e 60 00 mov $0x600e20,%edi
4004b5: 48 83 3f 00 cmpq $0x0,(%rdi)
4004b9: 75 05 jne 4004c0 <frame_dummy+0x10>
4004bb: eb 93 jmp 400450 <register_tm_clones>
4004bd: 0f 1f 00 nopl (%rax)
4004c0: b8 00 00 00 00 mov $0x0,%eax
4004c5: 48 85 c0 test %rax,%rax
4004c8: 74 f1 je 4004bb <frame_dummy+0xb>
4004ca: 55 push %rbp
4004cb: 48 89 e5 mov %rsp,%rbp
4004ce: ff d0 callq *%rax
4004d0: 5d pop %rbp
4004d1: e9 7a ff ff ff jmpq 400450 <register_tm_clones>
00000000004004d6 <reg_in>:
4004d6: 9c pushfq
4004d7: 55 push %rbp
4004d8: 48 89 e5 mov %rsp,%rbp
4004db: 57 push %rdi
4004dc: 56 push %rsi
4004dd: 52 push %rdx
4004de: 51 push %rcx
4004df: 41 50 push %r8
4004e1: 41 51 push %r9
4004e3: 50 push %rax
00000000004004e4 <main>:
4004e4: 55 push %rbp
4004e5: 48 89 e5 mov %rsp,%rbp
4004e8: 89 7d fc mov %edi,-0x4(%rbp)
4004eb: 48 89 75 f0 mov %rsi,-0x10(%rbp)
4004ef: b8 00 00 00 00 mov $0x0,%eax
4004f4: 5d pop %rbp
4004f5: c3 retq
4004f6: 66 2e 0f 1f 84 00 00 nopw %cs:0x0(%rax,%rax,1)
4004fd: 00 00 00