Hello,
I am trying to set up an Amanda backup for the first time, and my
problem is that on nearly every run one of the filesystem backups fails.
It is not always the same host that fails; the affected host changes
from run to run.
I have found nothing about something like this in the FAQ, but Ryan Williams
reported something similar on the mailing list. For him it was a
problem with media autosensing on the Ethernet card.
The next thing I will try is to set the autosensing Ethernet cards to a
fixed speed.
SYMPTOMS:
In the amanda mail report, the error is described as:
-------------------------------------------------------------------------------
...
FAILURE AND STRANGE DUMP SUMMARY:
wasa c0t0d0s4 lev 1 FAILED [mesg read: Connection reset by peer]
...
FAILED AND STRANGE DUMP DETAILS:
/-- wasa c0t0d0s4 lev 1 FAILED [mesg read: Connection reset by peer]
\--------
...
wasa c0t0d0s4 1 FAILED ---------------------------------------
...
(brought to you by Amanda version 2.4.2p2)
-------------------------------------------------------------------------------
On the affected host the /tmp/amanda/sendbackup.XXX.debug reads:
-------------------------------------------------------------------------------
sendbackup: debug 1 pid 4427 ruid 81 euid 81 start time Wed Jun 6 14:51:16 2001
/opt/amanda/libexec/sendbackup: version 2.4.2p2
sendbackup: got input request: DUMP c0t0d0s4 1 2001:6:5:10:59:44 OPTIONS |;bsd-auth;compress-fast;no-record;
parsed request as: program `DUMP'
disk `c0t0d0s4'
lev 1
since 2001:6:5:10:59:44
opt `|;bsd-auth;compress-fast;no-record;'
sendbackup: try_socksize: send buffer size is 65536
sendbackup: stream_server: waiting for connection: 0.0.0.0.40295
sendbackup: stream_server: waiting for connection: 0.0.0.0.40296
waiting for connect on 40295, then 40296
sendbackup: stream_accept: connection from 193.98.1.247.1309
sendbackup: stream_accept: timeout after 120 seconds
sendbackup: timeout on mesg port 40296
sendbackup: pid 4427 finish time Wed Jun 6 14:53:16 2001
-------------------------------------------------------------------------------
This used to read ``sendbackup: stream_accept: timeout after 30 seconds'',
but I tried to work around the problem by raising TIMEOUT from 30 to 120
in client-src/sendbackup.c (the backups still fail, just later):
-------------------------------------------------------------------------------
--- client-src/sendbackup.c.dist Thu Mar 15 03:17:36 2001
+++ client-src/sendbackup.c Wed Jun 6 14:12:42 2001
@@ -37,7 +37,7 @@
#include "getfsent.h"
#include "version.h"
-#define TIMEOUT 30
+#define TIMEOUT 120
int comppid = -1;
int dumppid = -1;
-------------------------------------------------------------------------------
CONFIGURATION:
- amanda v2.4.2p2, compiled by me.
- backup server: SuSE Linux 7.0 (i386), linux 2.4.2
Pentium II,
128 MB RAM,
2 SCSI Disks IBM DDYS-T36950N,
1 HP surestore BNCHMARK DLT1
Ethernet controller: 3Com Corporation 3c905C-TX [Fast Etherlink]
diff example/config.site /opt/amanda/etc/config.site
74a75,76
> #CONFIG_DIR=/etc/amanda
> CONFIG_DIR=/opt/amanda/etc
121a124
> DEFAULT_SERVER=backup.asys-h.de
147a151
> CLIENT_LOGIN=amanda
153a158
> SETUID_GROUP=disk
177a183
> DEFAULT_TAPE_SERVER=backup.asys-h.de
221a228
> USE_FQDN=yes
381a389
> DEBUGGING=/var/amanda/debug
426a435
> with_gnu_ld=yes
the stripped amanda.conf
-------------------------------------------------------------------------------
org "Extern"
mailto "[EMAIL PROTECTED]"
dumpuser "amanda"
inparallel 4
netusage 600 Kbps
dumpcycle 1 weeks
runspercycle 5
tapecycle 8 tapes
bumpsize 20 Mb
bumpdays 1
bumpmult 4
etimeout 300
dtimeout 1800
ctimeout 30
tapebufs 20
runtapes 1
tpchanger "chg-manual"
tapedev "/dev/nst0"
rawtapedev "/dev/null"
changerfile "/opt/amanda/etc/extern/changer.conf"
changerdev "/dev/null"
tapetype DLT1
labelstr "^Extern[0-9][0-9]*$"
holdingdisk hd1 {
comment "main holding disk"
directory "/dumps/amanda"
use -1 Mb
chunksize 1Gb
}
reserve 30
infofile "/logs/amanda/Extern/curinfo"
logdir "/logs/amanda/Extern"
indexdir "/logs/amanda/Extern/index"
define tapetype DLT1 {
comment "just produced by tapetype program"
length 34608 mbytes
filemark 21 kbytes
speed 1414 kps
}
define dumptype global {
comment "Global definitions"
record no
}
define dumptype always-full {
global
comment "Full dump of this filesystem always"
compress none
priority high
dumpcycle 0
}
define dumptype root-tar {
global
program "GNUTAR"
comment "root partitions dumped with tar"
compress none
index
exclude list "/usr/local/lib/amanda/exclude.gtar"
priority low
}
define dumptype user-tar {
root-tar
comment "user partitions dumped with tar"
priority medium
}
define dumptype comp-root-tar {
root-tar
comment "Root partitions with compression"
compress client fast
}
define dumptype comp-user-tar {
user-tar
compress client fast
}
define dumptype holding-disk {
global
comment "The master-host holding disk itself"
holdingdisk no
priority medium
}
define dumptype comp-user {
global
comment "Non-root partitions on reasonably fast machines"
compress client fast
priority medium
}
define dumptype nocomp-user {
comp-user
comment "Non-root partitions on slow machines"
compress none
}
define dumptype scomp-user {
comp-user
comment "Non-root partitions on slow machines"
compress server fast
}
define dumptype comp-root {
global
comment "Root partitions with compression"
compress client fast
priority low
}
define dumptype nocomp-root {
comp-root
comment "Root partitions without compression"
compress none
}
define dumptype scomp-root {
comp-root
comment "Root partitions with server compression"
compress server fast
}
define interface local {
comment "a local disk"
use 1000 kbps
}
define interface le0 {
comment "10 Mbps ethernet"
use 400 kbps
}
define interface hme0 {
comment "100 Mbps ethernet"
use 4000 kbps
}
-------------------------------------------------------------------------------
- backup clients: various Solaris 2.6 clients
Sun Ultra 1/140, 1/170, 1/170E
Sun Sparc Station 10
diff example/config.site /opt/amanda/etc/config.site
58a59
> INCLUDE_DIRS="/opt/gnu/include"
74a76,77
> #CONFIG_DIR=/etc/amanda
> CONFIG_DIR=/opt/amanda/etc
96a100
> NO_SERVER_MODE=true
121a126
> DEFAULT_SERVER=backup.asys-h.de
147a153
> CLIENT_LOGIN=amanda
153a160
> SETUID_GROUP=disk
177a185
> DEFAULT_TAPE_SERVER=backup.asys-h.de
221a230
> USE_FQDN=yes
381a391
> DEBUGGING=/var/amanda/debug
426a437
> with_gnu_ld=no
- backup clients: various SuSE versions
various PCs
diff example/config.site /opt/amanda/etc/config.site
74a75,76
> #CONFIG_DIR=/etc/amanda
> CONFIG_DIR=/opt/amanda/etc
96a99
> NO_SERVER_MODE=true
121a125
> DEFAULT_SERVER=backup.asys-h.de
147a152
> CLIENT_LOGIN=amanda
153a159
> SETUID_GROUP=disk
177a184
> DEFAULT_TAPE_SERVER=backup.asys-h.de
221a229
> USE_FQDN=yes
381a390
> DEBUGGING=/var/amanda/debug
426a436
> with_gnu_ld=yes
Regards
Andreas