Marc Haber said at 01/03/2007 10:08:
On Thu, Mar 01, 2007 at 09:50:40AM +0000, Ronny Adsetts wrote: Marc Haber said at 01/03/2007 09:13: On Wed, Feb 28, 2007 at 07:43:16PM +0000, Ronny Adsetts wrote: My first thought was hardware failure too, but it's not looking that way at the moment. The segfaults are too regular in their timing. I'll see if the same happens at 20:08. What does your exim log say in the respective time frame? Nothing for the email in the tcpdump gets logged to any of the exim logs AFAICS. I'm not seeing any problems on this server at all other than this segfault that started yesterday at ~3am and continues every hour when the same email is retried. So it is an incoming message? Can you strace -f your exim daemon in the time frame where you expect the retry to happen?
Strace for the crashing process attached. Command was: $ sudo strace -ff -o exim_strace /usr/sbin/exim4 -bd -q30m -oX 587:465:25 -oP /var/run/exim4/exim.pid Segfault log: Mar 1 11:09:16 nakor kernel: exim4[17576]: segfault at 0000000000000000 rip 0000002a96bbb220 rsp 0000007fbfffd758 error 4
Does this also happen when you use a backport of a more recent exim version?
I'll see if I can give it a go in a little while... it's the office mail server so I have to be a little careful. :-)
I'll send a heads-up to the GnuTLS guys.
Not sure from the strace that that's where the problem is... but then I'm not much of an strace guru. Let me know if there's anything else I can do. I'll let you know in a while, if I can, whether the current backports.org exim (4.63-17~bpo.1) crashes. Ronny -- Ronny Adsetts Technical Director Amazing Internet Ltd, London t: +44 20 8607 9535 f: +44 20 8607 9536 w: www.amazinginternet.com
getsockname(9, {sa_family=AF_INET, sin_port=htons(48945), sin_addr=inet_addr("172.16.1.20")}, [38654705680]) = 0 getpeername(9, 0x7fbfffd8e0, [68719476864]) = -1 ENOTCONN (Transport endpoint is not connected) close(3) = 0 close(4) = 0 close(5) = 0 close(6) = 0 close(7) = 0 close(8) = 0 rt_sigaction(SIGCHLD, {SIG_IGN}, NULL, 8) = 0 setsockopt(10, SOL_SOCKET, SO_KEEPALIVE, [1], 4) = 0 socket(PF_INET, SOCK_DGRAM, IPPROTO_IP) = 3 connect(3, {sa_family=AF_INET, sin_port=htons(53), sin_addr=inet_addr("172.16.1.20")}, 28) = 0 sendto(3, "c*\1\0\0\1\0\0\0\0\0\0\00219\00279\003179\00264\7in-ad"..., 43, 0, NULL, 0) = 43 gettimeofday({1172747355, 836759}, NULL) = 0 poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 5000) = 1 recvfrom(3, "c*\201\200\0\1\0\1\0\3\0\2\00219\00279\003179\00264\7i"..., 2048, 0, {sa_family=AF_INET, sin_port=htons(53), sin_addr=inet_addr("172.16.1.20")}, [16]) = 182 close(3) = 0 socket(PF_FILE, SOCK_STREAM, 0) = 3 connect(3, {sa_family=AF_FILE, path="/var/run/.nscd_socket"}, 110) = 0 writev(3, [{"\2\0\0\0\5\0\0\0\33\0\0\0", 12}, {"mail.griffinautomation.com\0", 27}], 2) = 39 read(3, "\2\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\377\377\377\377\377\377"..., 32) = 32 close(3) = 0 socket(PF_FILE, SOCK_STREAM, 0) = 3 connect(3, {sa_family=AF_FILE, path="/var/run/.nscd_socket"}, 110) = 0 writev(3, [{"\2\0\0\0\4\0\0\0\33\0\0\0", 12}, {"mail.griffinautomation.com\0", 27}], 2) = 39 read(3, "\2\0\0\0\1\0\0\0\33\0\0\0\0\0\0\0\2\0\0\0\4\0\0\0\1\0\0"..., 32) = 32 readv(3, [{"mail.griffinautomation.com\0", 27}, {"", 0}, {"@\263O\23", 4}], 3) = 31 read(3, NULL, 0) = 0 close(3) = 0 getpid() = 17576 time(NULL) = 1172747356 select(12, [11], NULL, NULL, {0, 0}) = 0 (Timeout) rt_sigaction(SIGTERM, {0x456200, [], 0x4000000}, NULL, 8) = 0 rt_sigaction(SIGALRM, {0x456170, [], 0x4000000}, NULL, 8) = 0 write(10, "220 nakor.amazing-internet.net E"..., 80) = 80 alarm(300) = 0 read(11, "EHLO mail.griffinautomation.com\r"..., 8192) = 33 alarm(0) = 300 rt_sigaction(SIGALRM, {0x425d50, [], 
0x4000000}, NULL, 8) = 0 getpid() = 17576 rt_sigaction(SIGALRM, {0x456170, [], 0x4000000}, NULL, 8) = 0 write(10, "250-nakor.amazing-internet.net H"..., 139) = 139 alarm(300) = 0 read(11, "STARTTLS\r\n", 8192) = 10 alarm(0) = 300 rt_sigaction(SIGALRM, {0x425d50, [], 0x4000000}, NULL, 8) = 0 brk(0) = 0x5f4000 brk(0x615000) = 0x615000 brk(0) = 0x615000 brk(0x636000) = 0x636000 open("/var/spool/exim4/gnutls-params", O_RDONLY) = 3 read(3, "@\0\0\0", 4) = 4 read(3, "\334\311E\3\332\202)M\376+\20s\226\313|W\271\30\347\306"..., 64) = 64 read(3, "\3\0\0\0", 4) = 4 read(3, "\1\0\1", 3) = 3 read(3, "@\0\0\0", 4) = 4 read(3, ";oyCD\316\366d\227\20+\301\32.\224>\37G\213\231un\35W\367"..., 64) = 64 read(3, " \0\0\0", 4) = 4 read(3, "\346!\326\32\301\26\267\341\312\335\10\34\37\253\322\21"..., 32) = 32 read(3, " \0\0\0", 4) = 4 read(3, "\365\232\177\247\231\341\355\274\237D\33P}4\374?\334\303"..., 32) = 32 read(3, " \0\0\0", 4) = 4 read(3, "\365\205l;[EMAIL PROTECTED]"..., 32) = 32 read(3, "`\0\0\0", 4) = 4 read(3, "\263\311\354\30,e\275\373\233df\275\v\314M\217\17~\315"..., 96) = 96 read(3, "\1\0\0\0", 4) = 4 read(3, "\6", 1) = 1 close(3) = 0 open("/etc/ssl/private/nakor.amazing-internet.net-key.pem", O_RDONLY) = 3 fstat(3, {st_mode=S_IFREG|0640, st_size=3243, ...}) = 0 mmap(NULL, 3243, PROT_READ, MAP_SHARED, 3, 0) = 0x2a9556b000 close(3) = 0 munmap(0x2a9556b000, 3243) = 0 open("/etc/ssl/certs/nakor.amazing-internet.net-cert.pem", O_RDONLY) = 3 fstat(3, {st_mode=S_IFREG|0644, st_size=2894, ...}) = 0 mmap(NULL, 2894, PROT_READ, MAP_SHARED, 3, 0) = 0x2a9556b000 close(3) = 0 munmap(0x2a9556b000, 2894) = 0 stat("/etc/ssl/certs/AINet-cacert.pem", {st_mode=S_IFREG|0644, st_size=2642, ...}) = 0 open("/etc/ssl/certs/AINet-cacert.pem", O_RDONLY) = 3 fstat(3, {st_mode=S_IFREG|0644, st_size=2642, ...}) = 0 mmap(NULL, 2642, PROT_READ, MAP_SHARED, 3, 0) = 0x2a9556b000 close(3) = 0 munmap(0x2a9556b000, 2642) = 0 write(10, "220 TLS go ahead\r\n", 18) = 18 alarm(300) = 0 recvfrom(10, 
"\26\3\1\0A", 5, 0, NULL, NULL) = 5 recvfrom(10, "\1\0\0=\3\1E\346\266XY\325=\10:[EMAIL PROTECTED]"..., 65, 0, NULL, NULL) = 65 time(NULL) = 1172747356 getpid() = 17576 time(NULL) = 1172747356 getpid() = 17576 access("/dev/random", R_OK) = 0 access("/dev/urandom", R_OK) = 0 open("/dev/urandom", O_RDONLY) = 3 select(4, [3], NULL, NULL, {3, 0}) = 1 (in [3], left {3, 0}) read(3, "-\37a]j\v\212\341\354\346\374\352\204\274\272N\3\2\365"..., 120) = 120 select(4, [3], NULL, NULL, {3, 0}) = 1 (in [3], left {3, 0}) read(3, "\"\240\233Y#\360\244\374\366\27\331\27\365\216\225\203"..., 120) = 120 select(4, [3], NULL, NULL, {3, 0}) = 1 (in [3], left {3, 0}) read(3, "F\332h\276\266\367\23\347\261\2367\326\33\247\273\272m"..., 120) = 120 select(4, [3], NULL, NULL, {3, 0}) = 1 (in [3], left {3, 0}) read(3, "\214\247\244\271aK7\342G\326\25\30Jt\212\2773\1\365\334"..., 120) = 120 select(4, [3], NULL, NULL, {3, 0}) = 1 (in [3], left {3, 0}) read(3, "\220\'\6U\327\277\376\32\322\253\351\35&0xb\326A\257*,"..., 120) = 120 gettimeofday({1172747356, 474726}, NULL) = 0 getrusage(RUSAGE_SELF, {ru_utime={0, 10998}, ru_stime={0, 6998}, ...}) = 0 time(NULL) = 1172747356 times({tms_utime=1, tms_stime=0, tms_cutime=0, tms_cstime=0}) = 1066672212 getpid() = 17576 time(NULL) = 1172747356 sendto(10, "\26\3\1\0J\2\0\0F\3\1E\346\264\\\256\t\tF\263Gi\226(\365"..., 79, 0, NULL, 0) = 79 sendto(10, "\26\3\1\10:\v\0\0106\0\0103\0\01000\202\10,0\202\6\24\240"..., 2111, 0, NULL, 0) = 2111 sendto(10, "\26\3\1\0\276\r\0\0\272\2\1\2\0\265\0\2630\201\2601\v0"..., 195, 0, NULL, 0) = 195 sendto(10, "\26\3\1\0\4\16\0\0\0", 9, 0, NULL, 0) = 9 recvfrom(10, "\26\3\1\0A", 5, 0, NULL, NULL) = 5 recvfrom(10, "\1\0\0=\3\1E\346\266XY\325=\10:[EMAIL PROTECTED]"..., 65, 0, NULL, NULL) = 65 time(NULL) = 1172747356 time(NULL) = 1172747356 --- SIGSEGV (Segmentation fault) @ 0 (0) ---
signature.asc
Description: OpenPGP digital signature