rgmanager doesn't start

Xander

New Member
Apr 17, 2013
20
0
1
Hi all !

I have a problem: I can't start a VM.

Executing HA start for VM 100
Member balthazar trying to enable pvevm:100...Could not connect to resource group manager
TASK ERROR: command 'clusvcadm -e pvevm:100 -m host' failed: exit code 1


All I did was change the network parameters (IP, gateway) on both nodes.

The cluster is working and the nodes see each other.


service rgmanager status
rgmanager is stopped




service rgmanager start
Starting Cluster Service Manager: [ OK ]

service rgmanager status
rgmanager is stopped



strace clusvcadm -e Apache
execve("/usr/sbin/clusvcadm", ["clusvcadm", "-e", "Apache"], [/* 16 vars */]) = 0
brk(0) = 0x1330000
access("/etc/ld.so.nohwcap", F_OK) = -1 ENOENT (No such file or directory)
mmap(NULL, 8192, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f99027d0000
access("/etc/ld.so.preload", R_OK) = -1 ENOENT (No such file or directory)
open("/etc/ld.so.cache", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=25185, ...}) = 0
mmap(NULL, 25185, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7f99027c9000
close(3) = 0
access("/etc/ld.so.nohwcap", F_OK) = -1 ENOENT (No such file or directory)
open("/usr/lib/libcman.so.3", O_RDONLY) = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0P\24\0\0\0\0\0\0"..., 832) = 832
fstat(3, {st_mode=S_IFREG|0644, st_size=18896, ...}) = 0
mmap(NULL, 2114192, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x7f99023b0000
mprotect(0x7f99023b4000, 2097152, PROT_NONE) = 0
mmap(0x7f99025b4000, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x4000) = 0x7f99025b4000
close(3) = 0
access("/etc/ld.so.nohwcap", F_OK) = -1 ENOENT (No such file or directory)
open("/lib/libpthread.so.0", O_RDONLY) = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\360Y\0\0\0\0\0\0"..., 832) = 832
fstat(3, {st_mode=S_IFREG|0755, st_size=131258, ...}) = 0
mmap(NULL, 2208640, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x7f9902194000
mprotect(0x7f99021ab000, 2093056, PROT_NONE) = 0
mmap(0x7f99023aa000, 8192, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x16000) = 0x7f99023aa000
mmap(0x7f99023ac000, 13184, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x7f99023ac000
close(3) = 0
access("/etc/ld.so.nohwcap", F_OK) = -1 ENOENT (No such file or directory)
open("/usr/lib/liblogthread.so.3", O_RDONLY) = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\220\16\0\0\0\0\0\0"..., 832) = 832
fstat(3, {st_mode=S_IFREG|0644, st_size=9512, ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f99027c8000
mmap(NULL, 2113288, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x7f9901f90000
mprotect(0x7f9901f92000, 2093056, PROT_NONE) = 0
mmap(0x7f9902191000, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x1000) = 0x7f9902191000
mmap(0x7f9902192000, 7944, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x7f9902192000
close(3) = 0
access("/etc/ld.so.nohwcap", F_OK) = -1 ENOENT (No such file or directory)
open("/lib/libc.so.6", O_RDONLY) = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\240\355\1\0\0\0\0\0"..., 832) = 832
fstat(3, {st_mode=S_IFREG|0755, st_size=1437064, ...}) = 0
mmap(NULL, 3545160, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x7f9901c2e000
mprotect(0x7f9901d87000, 2093056, PROT_NONE) = 0
mmap(0x7f9901f86000, 20480, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x158000) = 0x7f9901f86000
mmap(0x7f9901f8b000, 18504, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x7f9901f8b000
close(3) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f99027c7000
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f99027c6000
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f99027c5000
arch_prctl(ARCH_SET_FS, 0x7f99027c6700) = 0
mprotect(0x7f9901f86000, 16384, PROT_READ) = 0
mprotect(0x7f99023aa000, 4096, PROT_READ) = 0
mprotect(0x7f99027d2000, 4096, PROT_READ) = 0
munmap(0x7f99027c9000, 25185) = 0
set_tid_address(0x7f99027c69d0) = 8017
set_robust_list(0x7f99027c69e0, 0x18) = 0
futex(0x7fffbf029c0c, FUTEX_WAKE_PRIVATE, 1) = 0
futex(0x7fffbf029c0c, FUTEX_WAIT_BITSET_PRIVATE|FUTEX_CLOCK_REALTIME, 1, NULL, 7f99027c6700) = -1 EAGAIN (Resource temporarily unavailable)
rt_sigaction(SIGRTMIN, {0x7f9902199870, [], SA_RESTORER|SA_SIGINFO, 0x7f99021a2ff0}, NULL, 8) = 0
rt_sigaction(SIGRT_1, {0x7f9902199900, [], SA_RESTORER|SA_RESTART|SA_SIGINFO, 0x7f99021a2ff0}, NULL, 8) = 0
rt_sigprocmask(SIG_UNBLOCK, [RTMIN RT_1], NULL, 8) = 0
getrlimit(RLIMIT_STACK, {rlim_cur=8192*1024, rlim_max=RLIM_INFINITY}) = 0
rt_sigaction(SIGPIPE, {SIG_IGN, [PIPE], SA_RESTORER|SA_RESTART, 0x7f9901c60230}, {SIG_DFL, [], 0}, 8) = 0
brk(0) = 0x1330000
brk(0x1351000) = 0x1351000
socket(PF_FILE, SOCK_STREAM, 0) = 3
fcntl(3, F_SETFD, FD_CLOEXEC) = 0
connect(3, {sa_family=AF_FILE, path="/var/run/cman_client"}, 110) = 0
open("/dev/zero", O_RDONLY) = 4
fcntl(4, F_SETFD, FD_CLOEXEC) = 0
writev(3, [{"NAMC\3\0\0\20\24\0\0\0\7\0\0\0\0\0\0\0", 20}], 1) = 20
recvfrom(3, "NAMCu\201\322\212\210\3\0\0\7\0\0@\0\0\0\0", 20, 0, NULL, NULL) = 20
read(3, "\2\0\0\0\270\1\0\0\1\0\0\0\1\0\0\0\0\0\0\0004\0\0\0\2\0\0\0balt"..., 884) = 884
writev(3, [{"NAMC\3\0\0\20\24\0\0\0\7\0\0\0\0\0\0\0", 20}], 1) = 20
recvfrom(3, "NAMCu\201\322\212\210\3\0\0\7\0\0@\0\0\0\0", 20, 0, NULL, NULL) = 20
read(3, "\2\0\0\0\270\1\0\0\1\0\0\0\1\0\0\0\0\0\0\0004\0\0\0\2\0\0\0balt"..., 884) = 884
writev(3, [{"NAMC\3\0\0\20\314\1\0\0\220\0\0\0\0\0\0\0", 20}, {"h\227\2\277\0\0\0\0(A}\2\231\177\0\0(\24\366\367\0\0\0\0\0\0\0\0\0\0\0\0"..., 440}], 2) = 460
recvfrom(3, "NAMCu\201\322\212\320\1\0\0\220\0\0@\0\0\0\0", 20, 0, NULL, NULL) = 20
read(3, "\0\0\0\0\270\1\0\0\1\0\0\0\1\0\0\0\0\0\0\0004\0\0\0\2\0\0\0balt"..., 444) = 444
fstat(1, {st_mode=S_IFCHR|0620, st_rdev=makedev(136, 0), ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f99027cf000
write(1, "Local machine trying to enable s"..., 48Local machine trying to enable service:Apache...) = 48
socket(PF_FILE, SOCK_STREAM, 0) = 5
connect(5, {sa_family=AF_FILE, path="/var/run/cluster/rgmanager.sk"}, 110) = -1 ENOENT (No such file or directory)
close(5) = 0
write(1, "Could not connect to resource gr"..., 44Could not connect to resource group manager
) = 44
exit_group(1) = ?


It doesn't start. Can you explain why?
 
Hi,

It was simple: you made a mistake in the /etc/pve/cluster.conf file.

pvecm status on balthazar reported 2 nodes, but pvecm status on fenix reported only 1 node.

Then I looked and saw that balthazar had version 7 of the config, but fenix had only version 3. The cluster was broken :)

The mistake was here: the parameter two_node="1" was missing from the <cman> section of cluster.conf. When I added it and activated the new config, all nodes in the manager became green and our VM started successfully.

I also added a fencing config for our drac5 cards. We need to add a user/password for the DRAC in the BIOS to check it. We will do that on Monday :)
 

About

The Proxmox community has been around for many years and offers help and support for Proxmox VE, Proxmox Backup Server, and Proxmox Mail Gateway.
We think our community is one of the best thanks to people like you!

Get your subscription!

The Proxmox team works very hard to make sure you are running the best software and getting stable updates and security enhancements, as well as quick enterprise support. Tens of thousands of happy customers have a Proxmox subscription. Get yours easily in our online shop.

Buy now!