Ad Widget

Collapse

Agent crashing on start (1.4.2 on x86_64)

Collapse
X
 
  • Time
  • Show
Clear All
new posts
  • osoh
    Junior Member
    • May 2007
    • 11

    #1

    Agent crashing on start (1.4.2 on x86_64)

    Hi,

    I've compiled the Zabbix agent (version 1.4.2) on an SMP x86_64 system running Red Hat Enterprise Linux 5. The problem is that when I start the agent, it sadly crashes. With DebugLevel=5 set in zabbix_agentd.conf, I can read:

    Code:
     17973:20071030:145302 zabbix_agentd started. ZABBIX 1.4.2.
     17974:20071030:145302 zabbix_agentd collector started
     17975:20071030:145302 zabbix_agentd listener started
     17976:20071030:145302 zabbix_agentd listener started
     17977:20071030:145302 zabbix_agentd listener started
     17978:20071030:145302 zabbix_agentd active check started [X.X.X.X.:10051]
     17978:20071030:145302 In init_active_metrics()
     17978:20071030:145302 In refresh_metrics('X.X.X.X',10051)
     17978:20071030:145302 get_active_checks('X.X.X.X',10051)
     17978:20071030:145302 Get active checks error: Cannot connect to [X.X.X.X:10051] [No route to host]
     17978:20071030:145302 Getting list of active checks failed. Will retry after 60 seconds
     17973:20071030:145302 One child process died. Exiting ...
     17978:20071030:145302 Got signal. Exiting ...
     17973:20071030:145302 zbx_on_exit() called.
     17975:20071030:145302 Got signal. Exiting ...
     17976:20071030:145302 Got signal. Exiting ...
     17977:20071030:145302 Got signal. Exiting ...
     17973:20071030:145304 ZABBIX Agent stopped
    Obviously, "X.X.X.X" stands in for the host IP.

    I've got an x86 host running Zabbix 1.4.2 with no problems. How can I track down the cause of the trouble?
  • Alexei
    Founder, CEO
    Zabbix Certified Trainer
    Zabbix Certified Specialist, Zabbix Certified Professional
    • Sep 2004
    • 5654

    #2
    How many CPUs (cores) does the system have?
    Alexei Vladishev
    Creator of Zabbix, Product manager
    New York | Tokyo | Riga
    My Twitter

    Comment

    • derlla
      Junior Member
      • Dec 2007
      • 1

      #3
      I have the same problem on my host.
      Tyan VX50, 16 cores, 64 GB memory.

      Below is the output from strace


      -bash-3.00$ strace ./zabbix_agentd
      execve("./zabbix_agentd", ["./zabbix_agentd"], [/* 20 vars */]) = 0
      uname({sys="Linux", node="lnx40", ...}) = 0
      brk(0) = 0x51d000
      mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x2a95556000
      access("/etc/ld.so.preload", R_OK) = -1 ENOENT (No such file or directory)
      open("/etc/ld.so.cache", O_RDONLY) = 3
      fstat(3, {st_mode=S_IFREG|0644, st_size=148578, ...}) = 0
      mmap(NULL, 148578, PROT_READ, MAP_PRIVATE, 3, 0) = 0x2a95557000
      close(3) = 0
      open("/lib64/tls/libm.so.6", O_RDONLY) = 3
      read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\36 0=0}:"..., 832) = 832
      fstat(3, {st_mode=S_IFREG|0755, st_size=643240, ...}) = 0
      mmap(0x3a7d300000, 1593800, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x3a7d300000
      mprotect(0x3a7d385000, 1049032, PROT_NONE) = 0
      mmap(0x3a7d484000, 8192, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x84000) = 0x3a7d484000
      close(3) = 0
      open("/lib64/libresolv.so.2", O_RDONLY) = 3
      read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\24 06\220"..., 832) = 832
      fstat(3, {st_mode=S_IFREG|0755, st_size=93544, ...}) = 0
      mmap(0x3a7f900000, 1133256, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x3a7f900000
      mprotect(0x3a7f911000, 1063624, PROT_NONE) = 0
      mmap(0x3a7fa11000, 8192, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x11000) = 0x3a7fa11000
      mmap(0x3a7fa13000, 6856, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x3a7fa13000
      close(3) = 0
      open("/lib64/tls/libc.so.6", O_RDONLY) = 3
      read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\24 0\304"..., 832) = 832
      fstat(3, {st_mode=S_IFREG|0755, st_size=1622600, ...}) = 0
      mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x2a9557c000
      mmap(0x3a7d000000, 2314184, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x3a7d000000
      mprotect(0x3a7d12c000, 1085384, PROT_NONE) = 0
      mmap(0x3a7d22c000, 20480, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x12c000) = 0x3a7d22c000
      mmap(0x3a7d231000, 16328, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x3a7d231000
      close(3) = 0
      mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x2a9557d000
      mprotect(0x3a7d22c000, 12288, PROT_READ) = 0
      mprotect(0x3a7fa11000, 4096, PROT_READ) = 0
      mprotect(0x3a7d484000, 4096, PROT_READ) = 0
      mprotect(0x3a7cd14000, 4096, PROT_READ) = 0
      arch_prctl(ARCH_SET_FS, 0x2a9557d3c0) = 0
      munmap(0x2a95557000, 148578) = 0
      brk(0) = 0x51d000
      brk(0x53e000) = 0x53e000
      open("/etc/zabbix/zabbix_agentd.conf", O_RDONLY) = 3
      fstat(3, {st_mode=S_IFREG|0644, st_size=2464, ...}) = 0
      mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x2a95557000
      read(3, "# This is config file for zabbix"..., 4096) = 2464
      read(3, "", 4096) = 0
      close(3) = 0
      munmap(0x2a95557000, 4096) = 0
      open("/etc/zabbix/zabbix_agentd.conf", O_RDONLY) = 3
      fstat(3, {st_mode=S_IFREG|0644, st_size=2464, ...}) = 0
      mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x2a95557000
      read(3, "# This is config file for zabbix"..., 4096) = 2464
      read(3, "", 4096) = 0
      close(3) = 0
      munmap(0x2a95557000, 4096) = 0
      getuid() = 1001
      getgid() = 103
      clone(child_stack=0, flags=CLONE_CHILD_CLEARTID|CLONE_CHILD_SETTID|SIGCHLD, child_tidptr=0x2a9557d450) = 7482
      --- SIGCHLD (Child exited) @ 0 (0) ---
      exit_group(0) = ?
      Process 7481 detached

      Comment

      • Alexei
        Founder, CEO
        Zabbix Certified Trainer
        Zabbix Certified Specialist, Zabbix Certified Professional
        • Sep 2004
        • 5654

        #4
        This problem happens only for 16 CPU/core servers. It is already fixed. The fix will be available in 1.4.3.
        Alexei Vladishev
        Creator of Zabbix, Product manager
        New York | Tokyo | Riga
        My Twitter

        Comment

        Working...