Bug 763276 (GLUSTER-1544)

Summary: Create fails when 1 server is down
Product: [Community] GlusterFS Reporter: Anush Shetty <anush>
Component: replicate Assignee: Pavan Vilas Sondur <pavan>
Status: CLOSED CURRENTRELEASE QA Contact:
Severity: high Docs Contact:
Priority: low    
Version: mainline CC: gluster-bugs, vijay
Target Milestone: ---   
Target Release: ---   
Hardware: All   
OS: Linux   
Whiteboard:
Fixed In Version: Doc Type: Bug Fix
Doc Text:
Story Points: ---
Clone Of: Environment:
Last Closed: Type: ---
Regression: --- Mount Type: ---
Documentation: --- CRM:
Verified Versions: Category: ---
oVirt Team: --- RHEL 7.3 requirements from Atomic Host:
Cloudforms Team: --- Target Upstream Version:

Description Anush Shetty 2010-09-06 13:03:03 UTC
On a 2-subvolume replicate setup, when I bring one server down and then create a file, the create fails.

root@pitta:/mnt/gluster# strace touch dot
execve("/usr/bin/touch", ["touch", "dot"], [/* 36 vars */]) = 0
brk(0)                                  = 0x7c0000
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f545adc5000
access("/etc/ld.so.nohwcap", F_OK)      = -1 ENOENT (No such file or directory)
mmap(NULL, 8192, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f545adc3000
access("/etc/ld.so.preload", R_OK)      = -1 ENOENT (No such file or directory)
open("/etc/ld.so.cache", O_RDONLY)      = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=115391, ...}) = 0
mmap(NULL, 115391, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7f545ada6000
close(3)                                = 0
access("/etc/ld.so.nohwcap", F_OK)      = -1 ENOENT (No such file or directory)
open("/lib/librt.so.1", O_RDONLY)       = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\220!\0\0\0\0\0\0"..., 832) = 832
fstat(3, {st_mode=S_IFREG|0644, st_size=31744, ...}) = 0
mmap(NULL, 2128848, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x7f545a9a0000
mprotect(0x7f545a9a7000, 2093056, PROT_NONE) = 0
mmap(0x7f545aba6000, 8192, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x6000) = 0x7f545aba6000
close(3)                                = 0
access("/etc/ld.so.nohwcap", F_OK)      = -1 ENOENT (No such file or directory)
open("/lib/libc.so.6", O_RDONLY)        = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\320\353\1\0\0\0\0\0"..., 832) = 832
fstat(3, {st_mode=S_IFREG|0755, st_size=1494408, ...}) = 0
mmap(NULL, 3602440, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x7f545a630000
mprotect(0x7f545a796000, 2097152, PROT_NONE) = 0
mmap(0x7f545a996000, 20480, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x166000) = 0x7f545a996000
mmap(0x7f545a99b000, 18440, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x7f545a99b000
close(3)                                = 0
access("/etc/ld.so.nohwcap", F_OK)      = -1 ENOENT (No such file or directory)
open("/lib/libpthread.so.0", O_RDONLY)  = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\340X\0\0\0\0\0\0"..., 832) = 832
fstat(3, {st_mode=S_IFREG|0755, st_size=131174, ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f545ada5000
mmap(NULL, 2208640, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x7f545a414000
mprotect(0x7f545a42b000, 2093056, PROT_NONE) = 0
mmap(0x7f545a62a000, 8192, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x16000) = 0x7f545a62a000
mmap(0x7f545a62c000, 13184, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x7f545a62c000
close(3)                                = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f545ada4000
arch_prctl(ARCH_SET_FS, 0x7f545ada46f0) = 0
mprotect(0x7f545a62a000, 4096, PROT_READ) = 0
mprotect(0x7f545a996000, 16384, PROT_READ) = 0
mprotect(0x7f545aba6000, 4096, PROT_READ) = 0
mprotect(0x60d000, 4096, PROT_READ)     = 0
mprotect(0x7f545adc6000, 4096, PROT_READ) = 0
munmap(0x7f545ada6000, 115391)          = 0
set_tid_address(0x7f545ada47c0)         = 31675
set_robust_list(0x7f545ada47d0, 0x18)   = 0
futex(0x7fff00408f7c, FUTEX_WAKE_PRIVATE, 1) = 0
futex(0x7fff00408f7c, 0x189 /* FUTEX_??? */, 1, NULL, 7f545ada46f0) = -1 EAGAIN (Resource temporarily unavailable)
rt_sigaction(SIGRTMIN, {0x7f545a419760, [], SA_RESTORER|SA_SIGINFO, 0x7f545a423190}, NULL, 8) = 0
rt_sigaction(SIGRT_1, {0x7f545a4197f0, [], SA_RESTORER|SA_RESTART|SA_SIGINFO, 0x7f545a423190}, NULL, 8) = 0
rt_sigprocmask(SIG_UNBLOCK, [RTMIN RT_1], NULL, 8) = 0
getrlimit(RLIMIT_STACK, {rlim_cur=8192*1024, rlim_max=RLIM_INFINITY}) = 0
open("/usr/lib/locale/locale-archive", O_RDONLY) = -1 ENOENT (No such file or directory)
brk(0)                                  = 0x7c0000
brk(0x7e1000)                           = 0x7e1000
open("/usr/share/locale/locale.alias", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=2570, ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f545adc2000
read(3, "# Locale name alias data base.\n#"..., 4096) = 2570
read(3, "", 4096)                       = 0
close(3)                                = 0
munmap(0x7f545adc2000, 4096)            = 0
open("/usr/lib/locale/en_IN/LC_IDENTIFICATION", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=458, ...}) = 0
mmap(NULL, 458, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7f545adc2000
close(3)                                = 0
open("/usr/lib/locale/en_IN/LC_MEASUREMENT", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=23, ...}) = 0
mmap(NULL, 23, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7f545adc1000
close(3)                                = 0
open("/usr/lib/locale/en_IN/LC_TELEPHONE", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=53, ...}) = 0
mmap(NULL, 53, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7f545adc0000
close(3)                                = 0
open("/usr/lib/locale/en_IN/LC_ADDRESS", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=103, ...}) = 0
mmap(NULL, 103, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7f545adbf000
close(3)                                = 0
open("/usr/lib/locale/en_IN/LC_NAME", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=72, ...}) = 0
mmap(NULL, 72, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7f545adbe000
close(3)                                = 0
open("/usr/lib/locale/en_IN/LC_PAPER", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=34, ...}) = 0
mmap(NULL, 34, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7f545adbd000
close(3)                                = 0
open("/usr/lib/locale/en_IN/LC_MESSAGES", O_RDONLY) = 3
fstat(3, {st_mode=S_IFDIR|0755, st_size=4096, ...}) = 0
close(3)                                = 0
open("/usr/lib/locale/en_IN/LC_MESSAGES/SYS_LC_MESSAGES", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=53, ...}) = 0
mmap(NULL, 53, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7f545adbc000
close(3)                                = 0
open("/usr/lib/locale/en_IN/LC_MONETARY", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=294, ...}) = 0
mmap(NULL, 294, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7f545adbb000
close(3)                                = 0
open("/usr/lib/locale/en_IN/LC_COLLATE", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=966938, ...}) = 0
mmap(NULL, 966938, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7f545acb7000
close(3)                                = 0
open("/usr/lib/locale/en_IN/LC_TIME", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=2578, ...}) = 0
mmap(NULL, 2578, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7f545adba000
close(3)                                = 0
open("/usr/lib/locale/en_IN/LC_NUMERIC", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=54, ...}) = 0
mmap(NULL, 54, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7f545adb9000
close(3)                                = 0
open("/usr/lib/locale/en_IN/LC_CTYPE", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=256316, ...}) = 0
mmap(NULL, 256316, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7f545ac78000
close(3)                                = 0
open("dot", O_WRONLY|O_CREAT|O_NOCTTY|O_NONBLOCK, 0666

Comment 1 Vijay Bellur 2010-09-06 13:38:21 UTC
PATCH: http://patches.gluster.com/patch/4597 in master (cluster/afr: Fix hang in create when one subvol is down.)