Still getting a generator hang on 2.6.7

Steve Sether steve at vellmont.com
Wed Mar 15 17:41:26 GMT 2006


I've gotten around to testing the generator hang bug using stunnel
under 2.6.7, and I still occasionally get the same problem.  It
seems to happen around 50% of the time.  Here's some strace output from the
generator and receiver from two runs, one where the generator exits
properly, and one where it doesn't.  Run 2 hangs indefinitely.

Run 1

Generator:

Process 14581 attached - interrupt to quit
select(5, NULL, [4], NULL, {41, 810000}) = 0 (Timeout)
select(5, NULL, [4], NULL, {60, 0})     = 0 (Timeout)
select(5, NULL, [4], NULL, {60, 0})     = 1 (out [4], left {36, 700000})
write(4, "\0\0\0\0\0\0\0\0\0\0\0\0000B\0\0\0\240\0\0\0\0\0\0\0\0"..., 4092) = -1 ECONNRESET (Connection reset by peer)
getpid()                                = 14581
time(NULL)                              = 1142443238
write(3, "2006/03/15 11:20:38 [14581] rsyn"..., 142) = 142
rt_sigaction(SIGUSR1, {SIG_IGN}, NULL, 8) = 0
rt_sigaction(SIGUSR2, {SIG_IGN}, NULL, 8) = 0
getpid()                                = 14581
kill(14582, SIGUSR1)                    = 0
getpid()                                = 14581
time(NULL)                              = 1142443238
write(3, "2006/03/15 11:20:38 [14581] rsyn"..., 113) = 113
munmap(0x40018000, 4096)                = 0
_exit(12)                               = ?
Process 14581 detached

Receiver:
read(4, "IX\2444\216\243\365\26\222A\311\277\327\336d\375\336v\210"..., 8184) = 8184
time(NULL)                              = 1142443237
write(5, "\236/os\367&\330\237\6\25\njH\37\267\256~{\307\273i\27"..., 1024) = 1024
write(5, "\35\300,\305N\267\232v\343#\34\226\n\177\26\20\265J\r\t"..., 1024) = 1024
write(5, "K\16\377\0mE\260\274\230\351\0271\327\375\300\271z\177"..., 1024) = 1024
write(5, "\356$\306*\321MI:\325,\270\215\247D\271<\6\35\204\210\254"..., 1024) = 1024
write(5, "\217Ym\354\216\372\321]\355o\342Q\225\327\362\241\352\215"..., 1024) = 1024
write(5, "}R>N\246\263\177\357\r\363S\35|\264\311\10\305\365\375"..., 1024) = 1024
write(5, "\222\30\243-\303\215<\0369P\247\361nH\377\0\37x\245\315"..., 1024) = 1024
write(5, "2\260\300\245\332\337\304\377\0D\235\336K\251W\f\350\205"..., 1024) = 1024
write(5, "K\330\307\6\274\17\227Aob\374r\241\317R}\3341<S\210\274"..., 1024) = 1024
write(5, "\215\34\353\364&\334{\313On~\362\\\271\315V0m\\\315\22"..., 1024) = 1024
write(5, "$\243\n\307I\374\315A\3\34\30\nt[;\223\36r\273O\356\331"..., 1024) = 1024
write(5, "\216\215\266\346+sV\356\223+3\375\355^r\267o\320b I\22"..., 1024) = 1024
write(5, "\372\360S$\365${y!]\3360\17\21\376\257\360\365g\2753XW"..., 1024) = 1024
write(5, "\265\344\216D\344\250e\346\17w9\255/o\253_\246\211\330"..., 1024) = 1024
write(5, "\324\375\242\235e\307\335\312B\334\247\265O^\21!?\221\257"..., 1024) = 1024
write(5, "\240{{l*\r\325H\365\224\21E(x\316\244\322\241\203\33\336"..., 1017) = 1017
select(5, [4], [], NULL, {60, 0})       = 1 (in [4], left {60, 0})
read(4, "g!\230\315T,\224\247iu\356[\37\220\373\t\37R\201\275{h"..., 8184) = 8184
time(NULL)                              = 1142443237
select(5, [4], [], NULL, {60, 0})       = 1 (in [4], left {60, 0})
read(4, "\307\252S\200)\320c\237f\216+%\333\255e\244", 8184) = 16
time(NULL)                              = 1142443237
select(5, [4], [], NULL, {60, 0})       = 1 (in [4], left {59, 640000})
read(4, "+R\307\324\377\0\230ui=?\205\251\254Z\n\214\203x\351AF"..., 8184) = 8184
time(NULL)                              = 1142443238
write(5, "\221I\256\247=d\207+[\272\370t\341A\321\35\354\254\213"..., 1024) = 1024
write(5, "j\215GN\306\306AT\314|\354N\233\351\20*\205\344[\2369\367"..., 1024) = 1024
write(5, "\374h\236\203\234\231h/7!r\23\261\344\24\377\0J0\277\310"..., 1024) = 1024
--- SIGUSR1 (User defined signal 1) @ 0 (0) ---
Process 14582 detached




Run 2

Generator:

Process 14662 attached - interrupt to quit
select(5, NULL, [4], NULL, {56, 90000}) = ? ERESTARTNOHAND (To be restarted)
--- SIGCHLD (Child exited) @ 0 (0) ---
wait4(-1, [WIFEXITED(s) && WEXITSTATUS(s) == 12], WNOHANG, NULL) = 14670
wait4(-1, 0xbffe68d4, WNOHANG, NULL)    = -1 ECHILD (No child processes)
sigreturn()                             = ? (mask now [])
select(5, NULL, [4], NULL, {60, 0})     = 0 (Timeout)
select(5, NULL, [4], NULL, {60, 0})     = 0 (Timeout)
select(5, NULL, [4], NULL, {60, 0}


Receiver:
write(5, "\365P\3\346\245\217\215\20\373\30\265>R/\247\\\206.\237"..., 1024) = 1024
write(5, "\314\314\27\375\207\264\247a\345\370\to\6:\375\237\354"..., 1024) = 1024
write(5, "\244\376D\203\326\\T[\337n0|6{#B\3\26\3614\242\252\234"..., 1024) = 1024
write(5, "T0\250?h>c\310\361\363\4t\264\330=\323W\210\232<.\371\21"..., 1024) = 1024
write(5, "t\270\334\2577\33\211ef\313\32g\313\256\35\211\0166\252"..., 1024) = 1024
write(5, "\325\332\360\343w\0356~\205V\232\217z\4\307Jc\"\32zM\365"..., 1024) = 1024
write(5, "/I\3\3\364\v\31#\375W\263\30\371s\230&r^5\205\177\247\""..., 1024) = 1024
write(5, "\254@\275\340e\344\333R\26\215\207\365\0/\34\375=\260\334"..., 1024) = 1024
write(5, ">!\220O\364\300\311\257\361\0\31\177\321\24\374]B\367\226"..., 1024) = 1024
write(5, "|\353\325\367\21\244\n\216=\v\273x\37\"\363cp\17\327\353"..., 1024) = 1024
write(5, "YX\202B(\37RH\376\237A\356C\264\2242\353>\235D\327\320"..., 1024) = 1024
write(5, "\350\332.X\207\312\244\217\341\25\376|?\237^\245\334\333"..., 1024) = 1024
write(5, "\36Z\243\32\217\310W\247,\317q\354\314\35\25\5^U\367&6"..., 1024) = 1024
write(5, "\31)\336\302\343\\M\34\234\222M\223|\3349R\350h\253\330"..., 1024) = 1024
write(5, "+\31mV\312\344\322\367\275\300\254\233\353\315\227\351"..., 1024) = 1024
write(5, "\17\4Mo\317\264\334\327i\343l\366\273\234C\374b\312\340"..., 1018) = 1018
write(5, "\374G\333\t\10;\247s\356\214\344\305\211x\251\352\227\v"..., 149) = 149
select(5, [4], [], NULL, {60, 0})       = 1 (in [4], left {60, 0})
read(4, "m\356\261.\357\f\2767\217\2535\322\325\322~T", 8184) = 16
time(NULL)                              = 1142443576
select(5, [4], [], NULL, {60, 0})       = 1 (in [4], left {59, 830000})
read(4, 0x8099c98, 8184)                = -1 ECONNRESET (Connection reset by peer)
write(6, "2\0\0\rrsync: read error: Connectio"..., 54) = 54
rt_sigaction(SIGUSR1, {SIG_IGN}, NULL, 8) = 0
rt_sigaction(SIGUSR2, {SIG_IGN}, NULL, 8) = 0
write(6, "S\0\0\10rsync error: error in rsync "..., 87) = 87
munmap(0x40018000, 4096)                = 0
_exit(12)                               = ?
Process 14670 detached


More information about the rsync mailing list