Hello,

I am trying to set up an Amanda backup for the first time, and I have
the problem that nearly always one of the filesystem backups fails.
It does not always fail for the same host; the failing host changes
from run to run.

I have found nothing like this in the FAQ, but Ryan Williams
reported something similar on the mailing list. For him it was a
problem with media autosensing on the Ethernet card.

The next thing I will try is to set the autosensing Ethernet cards to a
fixed speed.


SYMPTOMS:

In the amanda mail report, the error is described as:
-------------------------------------------------------------------------------
...
FAILURE AND STRANGE DUMP SUMMARY:
  wasa       c0t0d0s4 lev 1 FAILED [mesg read: Connection reset by peer]
...
FAILED AND STRANGE DUMP DETAILS:

/-- wasa       c0t0d0s4 lev 1 FAILED [mesg read: Connection reset by peer]
\--------
...
wasa         c0t0d0s4    1 FAILED ---------------------------------------
...
(brought to you by Amanda version 2.4.2p2)
-------------------------------------------------------------------------------

On the affected host the /tmp/amanda/sendbackup.XXX.debug reads:
-------------------------------------------------------------------------------
sendbackup: debug 1 pid 4427 ruid 81 euid 81 start time Wed Jun  6 14:51:16 2001
/opt/amanda/libexec/sendbackup: version 2.4.2p2
sendbackup: got input request: DUMP c0t0d0s4 1 2001:6:5:10:59:44 OPTIONS |;bsd-a
uth;compress-fast;no-record;
  parsed request as: program `DUMP'
                     disk `c0t0d0s4'
                     lev 1
                     since 2001:6:5:10:59:44
                     opt `|;bsd-auth;compress-fast;no-record;'
sendbackup: try_socksize: send buffer size is 65536
sendbackup: stream_server: waiting for connection: 0.0.0.0.40295
sendbackup: stream_server: waiting for connection: 0.0.0.0.40296
  waiting for connect on 40295, then 40296
sendbackup: stream_accept: connection from 193.98.1.247.1309
sendbackup: stream_accept: timeout after 120 seconds
sendbackup: timeout on mesg port 40296
sendbackup: pid 4427 finish time Wed Jun  6 14:53:16 2001
-------------------------------------------------------------------------------

This used to be ``sendbackup: stream_accept: timeout after 30 seconds''.
I tried to circumvent the problem by raising TIMEOUT from 30 to 120 in
client-src/sendbackup.c, but as the log above shows, the accept on the
mesg port still times out:

-------------------------------------------------------------------------------
--- client-src/sendbackup.c.dist        Thu Mar 15 03:17:36 2001
+++ client-src/sendbackup.c     Wed Jun  6 14:12:42 2001
@@ -37,7 +37,7 @@
 #include "getfsent.h"
 #include "version.h"
 
-#define TIMEOUT 30
+#define TIMEOUT 120
 
 int comppid = -1;
 int dumppid = -1;
-------------------------------------------------------------------------------


CONFIGURATION:

  - amanda v2.4.2p2, compiled by me.

  - backup server: SuSE Linux 7.0 (i386), linux 2.4.2
    Pentium II, 
    128 MB RAM, 
    2 SCSI Disks IBM DDYS-T36950N,
    1 HP surestore BNCHMARK DLT1
    Ethernet controller: 3Com Corporation 3c905C-TX [Fast Etherlink]

diff example/config.site /opt/amanda/etc/config.site
74a75,76
> #CONFIG_DIR=/etc/amanda
> CONFIG_DIR=/opt/amanda/etc
121a124
> DEFAULT_SERVER=backup.asys-h.de
147a151
> CLIENT_LOGIN=amanda
153a158
> SETUID_GROUP=disk
177a183
> DEFAULT_TAPE_SERVER=backup.asys-h.de
221a228
> USE_FQDN=yes
381a389
> DEBUGGING=/var/amanda/debug
426a435
> with_gnu_ld=yes


    the stripped amanda.conf
-------------------------------------------------------------------------------
org "Extern"
mailto "[EMAIL PROTECTED]"
dumpuser "amanda"
inparallel 4
netusage  600 Kbps
dumpcycle 1 weeks
runspercycle 5
tapecycle 8 tapes
bumpsize 20 Mb
bumpdays 1
bumpmult 4
etimeout 300
dtimeout 1800
ctimeout 30

tapebufs 20
runtapes 1
tpchanger "chg-manual"
tapedev "/dev/nst0"
rawtapedev "/dev/null"
changerfile "/opt/amanda/etc/extern/changer.conf"
changerdev "/dev/null"
tapetype DLT1
labelstr "^Extern[0-9][0-9]*$"

holdingdisk hd1 {
    comment "main holding disk"
    directory "/dumps/amanda"
    use -1 Mb
    chunksize 1Gb
}

reserve 30
infofile "/logs/amanda/Extern/curinfo"
logdir   "/logs/amanda/Extern"
indexdir "/logs/amanda/Extern/index"

define tapetype DLT1 {
    comment "just produced by tapetype program"
    length 34608 mbytes
    filemark 21 kbytes
    speed 1414 kps
}

define dumptype global {
    comment "Global definitions"
record no
}

define dumptype always-full {
    global
    comment "Full dump of this filesystem always"
    compress none
    priority high
    dumpcycle 0
}

define dumptype root-tar {
    global
    program "GNUTAR"
    comment "root partitions dumped with tar"
    compress none
    index
    exclude list "/usr/local/lib/amanda/exclude.gtar"
    priority low
}

define dumptype user-tar {
    root-tar
    comment "user partitions dumped with tar"
    priority medium
}

define dumptype comp-root-tar {
    root-tar
    comment "Root partitions with compression"
    compress client fast
}

define dumptype comp-user-tar {
    user-tar
    compress client fast
}

define dumptype holding-disk {
    global
    comment "The master-host holding disk itself"
    holdingdisk no
    priority medium
}

define dumptype comp-user {
    global
    comment "Non-root partitions on reasonably fast machines"
    compress client fast
    priority medium
}

define dumptype nocomp-user {
    comp-user
    comment "Non-root partitions on slow machines"
    compress none
}

define dumptype scomp-user {
    comp-user
    comment "Non-root partitions on slow machines"
    compress server fast
}

define dumptype comp-root {
    global
    comment "Root partitions with compression"
    compress client fast
    priority low
}

define dumptype nocomp-root {
    comp-root
    comment "Root partitions without compression"
    compress none
}

define dumptype scomp-root {
    comp-root
    comment "Root partitions with server compression"
    compress server fast
}

define interface local {
    comment "a local disk"
    use 1000 kbps
}

define interface le0 {
    comment "10 Mbps ethernet"
    use 400 kbps
}

define interface hme0 {
    comment "100 Mbps ethernet"
    use 4000 kbps
}
-------------------------------------------------------------------------------


  - backup clients: various Solaris 2.6 clients
    Sun Ultra 1/140, 1/170, 1/170E
    Sun Sparc Station 10

diff example/config.site /opt/amanda/etc/config.site
58a59
> INCLUDE_DIRS="/opt/gnu/include"
74a76,77
> #CONFIG_DIR=/etc/amanda
> CONFIG_DIR=/opt/amanda/etc
96a100
> NO_SERVER_MODE=true
121a126
> DEFAULT_SERVER=backup.asys-h.de
147a153
> CLIENT_LOGIN=amanda
153a160
> SETUID_GROUP=disk
177a185
> DEFAULT_TAPE_SERVER=backup.asys-h.de
221a230
> USE_FQDN=yes
381a391
> DEBUGGING=/var/amanda/debug
426a437
> with_gnu_ld=no


  - backup clients: various SuSE versions
    various PCs

diff example/config.site /opt/amanda/etc/config.site
74a75,76
> #CONFIG_DIR=/etc/amanda
> CONFIG_DIR=/opt/amanda/etc
96a99
> NO_SERVER_MODE=true
121a125
> DEFAULT_SERVER=backup.asys-h.de
147a152
> CLIENT_LOGIN=amanda
153a159
> SETUID_GROUP=disk
177a184
> DEFAULT_TAPE_SERVER=backup.asys-h.de
221a229
> USE_FQDN=yes
381a390
> DEBUGGING=/var/amanda/debug
426a436
> with_gnu_ld=yes



                                        Regards
                                                Andreas


Reply via email to