Ad Widget

Collapse

Zabbix dies after start

Collapse
X
 
  • Time
  • Show
Clear All
new posts
  • Inakrin
    Junior Member
    • Dec 2009
    • 10

    #1

    Zabbix dies after start

    Zabbix dies after start. It's end of log file


    28403:20100210:222125.029 In delete_history(history_text,200200000010033,7,1265 804484)
    28403:20100210:222125.029 Query [txnlev:0] [select min(clock) from history_text where itemid=200200000010033]
    28403:20100210:222125.030 In delete_history(history_log,200200000010033,7,12658 04484)
    28403:20100210:222125.030 Query [txnlev:0] [select min(clock) from history_log where itemid=200200000010033]
    28403:20100210:222125.031 In delete_history(trends,200200000010033,365,12658044 84)
    28403:20100210:222125.031 Query [txnlev:0] [select min(clock) from trends where itemid=200200000010033]
    28403:20100210:222125.032 In delete_history(trends_uint,200200000010033,365,126 5804484)
    28403:20100210:222125.032 Query [txnlev:0] [select min(clock) from trends_uint where itemid=200200000010033]
    28403:20100210:222125.032 In delete_history(history,200200000010036,7,126580448 4)
    28403:20100210:222125.032 Query [txnlev:0] [select min(clock) from history where itemid=200200000010036]
    28403:20100210:222125.033 In delete_history(history_uint,200200000010036,7,1265 804484)
    28403:20100210:222125.033 Query [txnlev:0] [select min(clock) from history_uint where itemid=200200000010036]
    28405:20100210:222125.034 In update_maintenance_hosts()
    28405:20100210:222125.034 Query [txnlev:1] [select hostid,maintenance_type,maintenance_from from hosts where status=0 and maintenance_status=1]
    28403:20100210:222125.034 In delete_history(history_str,200200000010036,7,12658 04484)
    28403:20100210:222125.034 Query [txnlev:0] [select min(clock) from history_str where itemid=200200000010036]
    28405:20100210:222125.034 End of update_maintenance_hosts()
    28403:20100210:222125.035 In delete_history(history_text,200200000010036,7,1265 804484)
    28403:20100210:222125.035 Query [txnlev:0] [select min(clock) from history_text where itemid=200200000010036]
    28403:20100210:222125.036 In delete_history(history_log,200200000010036,7,12658 04484)
    28403:20100210:222125.036 Query [txnlev:0] [select min(clock) from history_log where itemid=200200000010036]
    28403:20100210:222125.037 In delete_history(trends,200200000010036,365,12658044 84)
    28403:20100210:222125.037 Query [txnlev:0] [select min(clock) from trends where itemid=200200000010036]
    28378:20100210:222125.037 In init_config()
    28378:20100210:222125.037 Query [txnlev:0] [select mt.mediatypeid, mt.type, mt.description, mt.smtp_server, mt.smtp_helo, mt.smtp_email, mt.exec_path, mt.gsm_modem, mt.username, mt.passwd, m.mediaid,m.userid,m.mediatypeid,m.sendto,m.severity,m.period from media m, users_groups u, config c,media_type mt where m.userid=u.userid and u.usrgrpid=c.alert_usrgrpid and m.mediatypeid=mt.mediatypeid and m.active=0]
    28383:20100210:222125.036 In get_values()
    28403:20100210:222125.038 In delete_history(trends_uint,200200000010036,365,126 5804484)
    28403:20100210:222125.038 Query [txnlev:0] [select min(clock) from trends_uint where itemid=200200000010036]
    28383:20100210:222125.038 In DCinit_nextchecks()
    28403:20100210:222125.039 In delete_history(history,200200000010037,7,126580448 4)
    28403:20100210:222125.039 Query [txnlev:0] [select min(clock) from history where itemid=200200000010037]
    28383:20100210:222125.039 In DCconfig_get_poller_items() poller_type:0 poller_num:2
    28403:20100210:222125.040 In delete_history(history_uint,200200000010037,7,1265 804484)
    28403:20100210:222125.040 Query [txnlev:0] [select min(clock) from history_uint where itemid=200200000010037]
    28383:20100210:222125.040 End of DCconfig_get_poller_items():0
    28383:20100210:222125.040 In DCflush_nextchecks()
    28403:20100210:222125.040 In delete_history(history_str,200200000010037,7,12658 04484)
    28403:20100210:222125.041 Query [txnlev:0] [select min(clock) from history_str where itemid=200200000010037]
    28403:20100210:222125.041 In delete_history(history_text,200200000010037,7,1265 804484)
    28403:20100210:222125.041 Query [txnlev:0] [select min(clock) from history_text where itemid=200200000010037]
    28378:20100210:222125.042 In ping_database()
    28403:20100210:222125.042 In delete_history(history_log,200200000010037,7,12658 04484)
    28403:20100210:222125.042 Query [txnlev:0] [select min(clock) from history_log where itemid=200200000010037]
    28383:20100210:222125.042 End of get_values()
    28383:20100210:222125.043 In DCconfig_get_normal_poller_nextcheck() poller_type:0 poller_num:2
    28383:20100210:222125.043 End of DCconfig_get_normal_poller_nextcheck():-1
    28403:20100210:222125.043 In delete_history(trends,200200000010037,365,12658044 84)
    28403:20100210:222125.043 Query [txnlev:0] [select min(clock) from trends where itemid=200200000010037]
    28403:20100210:222125.044 In delete_history(trends_uint,200200000010037,365,126 5804484)
    28403:20100210:222125.044 Query [txnlev:0] [select min(clock) from trends_uint where itemid=200200000010037]
    28403:20100210:222125.044 In delete_history(history,200200000010038,7,126580448 4)
    28403:20100210:222125.044 Query [txnlev:0] [select min(clock) from history where itemid=200200000010038]
    28403:20100210:222125.045 In delete_history(history_uint,200200000010038,7,1265 804484)
    28403:20100210:222125.045 Query [txnlev:0] [select min(clock) from history_uint where itemid=200200000010038]
    28383:20100210:222125.043 Poller #2 spent 0.006236 seconds while updating 0 values. Sleeping for 5 seconds
    28403:20100210:222125.046 In delete_history(history_str,200200000010038,7,12658 04484)
    28403:20100210:222125.046 Query [txnlev:0] [select min(clock) from history_str where itemid=200200000010038]
    28403:20100210:222125.047 In delete_history(history_text,200200000010038,7,1265 804484)
    28403:20100210:222125.047 Query [txnlev:0] [select min(clock) from history_text where itemid=200200000010038]
    28403:20100210:222125.048 In delete_history(history_log,200200000010038,7,12658 04484)
    28403:20100210:222125.048 Query [txnlev:0] [select min(clock) from history_log where itemid=200200000010038]
    28378:20100210:222125.048 One child process died (PID:28414). Exiting ...
    28403:20100210:222125.048 In delete_history(trends,200200000010038,365,12658044 84)
    28378:20100210:222127.054 Connect to the database
    28378:20100210:222127.241 In free_database_cache()
    28378:20100210:222127.241 In DCsync_all()
    28378:20100210:222127.241 In DCsync_history(history_first:0 history_num:0)
    28378:20100210:222127.241 Syncing history data...
    28378:20100210:222127.241 In DCsync_trends() trends_num:0
    28378:20100210:222127.241 Syncing trends data...
    28378:20100210:222127.241 Syncing trends data...done.
    28378:20100210:222127.242 End of DCsync_trends()
    28378:20100210:222127.242 End of DCsync_all()
    28378:20100210:222127.242 End of free_database_cache()
    28378:20100210:222127.242 In free_configuration_cache()
    28378:20100210:222127.242 End of free_configuration_cache()
    28378:20100210:222127.247 Zabbix Server stopped. Zabbix 1.8.1 (revision 9702).
  • Inakrin
    Junior Member
    • Dec 2009
    • 10

    #2
    This is the full log with debug level 4.
    Attached Files

    Comment

    • hjansen
      Junior Member
      • Feb 2010
      • 3

      #3
      i have the same problem

      6378:20100212:153444.877 Starting zabbix_server. Zabbix 1.8.1 (revision 9702).
      6378:20100212:153444.910 **** Enabled features ****
      6378:20100212:153444.935 SNMP monitoring: NO
      6378:20100212:153444.962 IPMI monitoring: NO
      6378:20100212:153444.985 WEB monitoring: NO
      6378:20100212:153445.010 Jabber notifications: NO
      6378:20100212:153445.031 ODBC: NO
      6378:20100212:153445.084 SSH2 support: NO
      6378:20100212:153445.131 IPv6 support: NO
      6378:20100212:153445.158 **************************
      6378:20100212:153445.198 Connect to the database
      6378:20100212:153445.397 Query [txnlev:0] [SET NAMES utf8]
      6378:20100212:153445.426 Query [txnlev:0] [SET CHARACTER SET utf8]
      6378:20100212:153445.455 Query [txnlev:0] [select refresh_unsupported from config where 1=1 and configid between 000000000000000 and 099999999999999]
      6378:20100212:153445.478 Query [txnlev:0] [select masterid from nodes where nodeid=0]
      6378:20100212:153445.509 In DBupdate_triggers_after_restart()
      6378:20100212:153445.531 Query [txnlev:1] [begin;]
      6378:20100212:153445.547 Query [txnlev:1] [select distinct t.triggerid,t.expression,t.description,t.status,t.priority,t.value,t.url,t.comments from hosts h,items i,triggers t,functions f where h.hostid=i.hostid and i.itemid=f.itemid and f.triggerid=t.triggerid and h.status in (0) and i.status in (0) and t.status in (0) and i.type not in (2) and i.key_ not in ('status','zabbix[log]')]
      6378:20100212:153445.593 Query [txnlev:1] [commit;]
      6378:20100212:153445.627 End of DBupdate_triggers_after_restart()
      6378:20100212:153445.653 In init_database_cache() size:29361112
      6378:20100212:153445.689 In init_configuration_cache() size:8388608
      6380:20100212:153445.717 server #2 started [Alerter]
      6385:20100212:153445.720 server #7 started [Escalator]
      6379:20100212:153445.747 server #1 started [DB Cache]
      6382:20100212:153445.747 server #4 started [Timer]
      6381:20100212:153445.718 server #3 started [Housekeeper]
      6378:20100212:153445.766 server #0 started [Watchdog]
      6379:20100212:153445.792 In main_dbconfig_loop()
      6384:20100212:153445.764 server #6 started [DB Syncer]
      6380:20100212:153445.804 Connect to the database
      6383:20100212:153445.790 server #5 started [Node watcher. Node ID:0]
      6385:20100212:153445.803 In main_escalator_loop()
      6382:20100212:153445.823 Connect to the database
      6379:20100212:153445.825 Connect to the database
      6378:20100212:153445.855 In main_watchdog_loop()
      6384:20100212:153445.857 In main_dbsyncer_loop()
      6385:20100212:153445.860 Connect to the database
      6383:20100212:153445.859 In main_nodeupdater_loop()
      6380:20100212:153445.877 Query [txnlev:0] [SET NAMES utf8]
      6382:20100212:153445.878 Query [txnlev:0] [SET NAMES utf8]
      6379:20100212:153445.886 Query [txnlev:0] [SET NAMES utf8]
      6378:20100212:153445.899 Connect to the database
      6383:20100212:153445.900 Starting sync with nodes
      6384:20100212:153445.901 Connect to the database
      6385:20100212:153445.903 Query [txnlev:0] [SET NAMES utf8]
      6380:20100212:153445.904 Query [txnlev:0] [SET CHARACTER SET utf8]
      6382:20100212:153445.928 Query [txnlev:0] [SET CHARACTER SET utf8]
      6383:20100212:153445.928 Connect to the database
      6379:20100212:153445.957 Query [txnlev:0] [SET CHARACTER SET utf8]
      6380:20100212:153445.959 Query [txnlev:0] [select a.alertid,a.mediatypeid,a.sendto,a.subject,a.message,a.status,mt.mediatypeid,mt.type,mt.description,mt.smtp_server,mt.smtp_helo,mt.smtp_email,mt.exec_path,mt.gsm_modem,mt.username,mt.passwd,a.retries from alerts a,media_type mt where a.status=0 and a.mediatypeid=mt.mediatypeid and a.alerttype=0 and mt.mediatypeid between 000000000000000 and 099999999999999 order by a.clock]
      6385:20100212:153445.959 Query [txnlev:0] [SET CHARACTER SET utf8]
      6378:20100212:153445.960 Query [txnlev:0] [SET NAMES utf8]
      6382:20100212:153446.020 Query [txnlev:0] [select distinct i.itemid,i.key_,h.host,h.port,i.delay,i.description,i.type,h.useip,h.ip,i.history,i.lastvalue,i.prevvalue,i.hostid,i.value_type,i.delta,i.prevorgvalue,i.lastclock,i.units,i.multiplier,i.formula,i.status,i.valuemapid,h.dns,i.trends,i.lastlogsize,i.data_type,i.mtime from hosts h,items i, functions f where h.hostid=i.hostid and h.status=0 and i.status=0 and f.function in ('nodata','date','dayofweek','time','now') and i.itemid=f.itemid and (h.maintenance_status=0 or h.maintenance_type=0) and h.hostid between 000000000000000 and 099999999999999]
      6384:20100212:153446.015 Query [txnlev:0] [SET NAMES utf8]
      6379:20100212:153446.025 Syncing ...
      6385:20100212:153446.033 In process_escalations()
      6383:20100212:153446.023 Query [txnlev:0] [SET NAMES utf8]
      6378:20100212:153446.031 Query [txnlev:0] [SET CHARACTER SET utf8]
      6379:20100212:153446.050 In DCsync_confguration()
      6384:20100212:153446.060 Query [txnlev:0] [SET CHARACTER SET utf8]
      6385:20100212:153446.078 Query [txnlev:0] [select escalationid,actionid,triggerid,eventid,r_eventid, esc_step,status from escalations where status in (0,1) and nextcheck<=1265985286 and escalationid between 000000000000000 and 099999999999999]
      6382:20100212:153446.080 In process_maintenance()
      6379:20100212:153446.095 In DCsync_hosts()
      6378:20100212:153446.100 In init_config()
      6384:20100212:153446.124 Syncing ...
      6383:20100212:153446.106 Query [txnlev:0] [SET CHARACTER SET utf8]
      6385:20100212:153446.133 Escalator spent 0.080761 seconds while processing escalation items. Nextcheck after 3 sec.
      6379:20100212:153446.136 Query [txnlev:0] [select hostid,proxy_hostid,host,useip,ip,dns,port,status,useipmi,ipmi_ip,ipmi_port,ipmi_authtype,ipmi_privilege,ipmi_username,ipmi_password,maintenance_status,maintenance_type,maintenance_from,errors_from,available,disable_until,snmp_errors_from,snmp_available,snmp_disable_until,ipmi_errors_from,ipmi_available,ipmi_disable_until from hosts where status in (0) and hostid between 000000000000000 and 099999999999999 order by hostid]
      6382:20100212:153446.134 Query [txnlev:0] [select m.maintenanceid,m.maintenance_type,m.active_since, tp.timeperiod_type,tp.every,tp.month,tp.dayofweek, tp.day,tp.start_time,tp.period,tp.start_date from maintenances m,maintenances_windows mw,timeperiods tp where m.maintenanceid=mw.maintenanceid and mw.timeperiodid=tp.timeperiodid and 1265985286 between m.active_since and m.active_till]
      6378:20100212:153446.161 Query [txnlev:0] [select mt.mediatypeid, mt.type, mt.description, mt.smtp_server, mt.smtp_helo, mt.smtp_email, mt.exec_path, mt.gsm_modem, mt.username, mt.passwd, m.mediaid,m.userid,m.mediatypeid,m.sendto,m.severity,m.period from media m, users_groups u, config c,media_type mt where m.userid=u.userid and u.usrgrpid=c.alert_usrgrpid and m.mediatypeid=mt.mediatypeid and m.active=0]
      6384:20100212:153446.176 In DCsync_history(history_first:0 history_num:0)
      6383:20100212:153446.175 In main_historysender()
      6382:20100212:153446.212 In update_maintenance_hosts()
      6378:20100212:153446.234 One child process died (PID:6379). Exiting ...
      6384:20100212:153446.240 DB syncer spent 0.061523 second while processing 0 items. Nextsync after 5 sec.
      6383:20100212:153446.255 Sleeping 9 seconds
      6378:20100212:153448.298 Connect to the database
      6378:20100212:153448.346 Query [txnlev:0] [SET NAMES utf8]
      6378:20100212:153448.395 Query [txnlev:0] [SET CHARACTER SET utf8]
      6378:20100212:153448.439 In free_database_cache()
      6378:20100212:153448.480 In DCsync_all()
      6378:20100212:153448.548 In DCsync_history(history_first:0 history_num:0)
      6378:20100212:153448.592 Syncing history data...
      6378:20100212:153448.630 In DCsync_trends() trends_num:0
      6378:20100212:153448.687 Syncing trends data...
      6378:20100212:153448.741 Syncing trends data...done.
      6378:20100212:153448.774 End of DCsync_trends()
      6378:20100212:153448.811 End of DCsync_all()
      6378:20100212:153448.862 End of free_database_cache()
      6378:20100212:153448.909 In free_configuration_cache()

      Comment

      • s.ivlenkov
        Junior Member
        • Jan 2010
        • 5

        #4
        zabbix_server die after start

        If you solve this problem, please, post solution.
        I have the same problem.

        zabbix_server 1.8.1 dies after start with "One child process died" (Solaris 10, MySQL 5.0.67). After that, all zabbix processes are marked as <defunct>.

        $ grep 713 zabbix_server.log

        713:20100311:115621.297 Query [txnlev:0] [select hostid,proxy_hostid,host,useip,ip,dns,port,status,useipmi,ipmi_ip,ipmi_port,ipmi_authtype,ipmi_privilege,ipmi_username,ipmi_password,maintenance_status,maintenance_type,maintenance_from,errors_from,available,disable_until,snmp_errors_from,snmp_available,snmp_disable_until,ipmi_errors_from,ipmi_available,ipmi_disable_until from hosts where status in (0) and hostid between 000000000000000 and 099999999999999 order by hostid]
        722:20100311:115622.713 In delete_history(trends_uint,17005,365,1268297782)
        722:20100311:115622.713 Query [txnlev:0] [select min(clock) from trends_uint where itemid=17005]
        722:20100311:115622.713 In delete_history(history,17006,7,1268297782)
        722:20100311:115622.713 Query [txnlev:0] [select min(clock) from history where itemid=17006]
        722:20100311:115622.713 In delete_history(history_uint,17006,7,1268297782)
        712:20100311:115623.442 One child process died (PID:713). Exiting ...

        Comment

        • Inakrin
          Junior Member
          • Dec 2009
          • 10

          #5
          Solution

          Yes, I solved this problem. You need to use packages from coolstack (http://cooltools.sunsource.net/coolstack/).
          After compiling with 32-bit mysql libs from coolstack all works correctly.

          Comment

          • s.ivlenkov
            Junior Member
            • Jan 2010
            • 5

            #6
            Thanks.
            But in my case it doesn't help.

            I tried mysql32 from coolstack, I even tried to link zabbix_server with postgresql (from sunfreeware).

            Problem remains the same.
            I've opened the case ZBX-2153.

            zabbix 1.8.1, Solaris 10.

            Comment

            • treelowa
              Junior Member
              • Apr 2010
              • 6

              #7
              Originally posted by s.ivlenkov
              Thanks.
              But in my case it doesn't helps.

              I tried mysql32 from coolstack, I even tried to link zabbix_server with postgresql (from sunfreeware).

              Problem remains the same.
              I've opened the case ZBX-2153.

              zabbix 1.8.1, Solaris 10.
              I am using 1.8.2 on Solaris 10 with the binary MySQL 5 release and have the same issue. As soon as I enable any server to be monitored, even the Zabbix server itself, the server process crashes. If you have any update I would love to hear about it.

              Many thanks.

              Comment

              • s.ivlenkov
                Junior Member
                • Jan 2010
                • 5

                #8
                Originally posted by treelowa
                I am using 1.8.2, solaris 10, with bin mysql 5 release and have the same issue. As soon as I enable any server, even Zabbix server to be monitored the server process crash.
                Please, take a look at https://support.zabbix.com/browse/ZBX-2153

                Fix from Marco Walther (18/Mar/10 02:37 AM) helps in my case.

                The problem is in src/libs/zbxdbcache/dbconfig.c: The first struct in the shared memory segment (ZBX_DC_CONFIG)
                needs only 4-byte alignment, while all the following contain zbx_uint64_t elements and need 8-byte alignment. There
                are some `int's in there but they will always be allocated in multiples of four, so they don't influence the alignment.

                That will work pretty well on x86 which does not show those mis-alignment problems. But SPARC will fail because it
                normally enforces the alignment. There are compiler switches, but they will create a big runtime penalty.

                The fix is to make sure the size of ZBX_DC_CONFIG is a multiple of the biggest alignment.


                Code:
                 
                --- zabbix-1.8.1.orig/src/libs/zbxdbcache/dbconfig.c 2010-01-27 13:22:44.000000000 -0800 
                +++ zabbix-1.8.1/src/libs/zbxdbcache/dbconfig.c 2010-03-17 18:06:47.377350002 -0700 
                @@ -2165,6 +2165,12 @@ 
                
                        sz = sizeof(ZBX_DC_CONFIG); 
                
                +#ifndef ORIGINAL
                +       if (sz % sizeof(zbx_uint64_t) != 0) {
                +               sz = (sz / sizeof(zbx_uint64_t) + 1) * sizeof(zbx_uint64_t);
                +       }
                +#endif
                + 
                        if (CONFIG_DBCONFIG_SIZE < sz) 
                        { 
                                zbx_error("Configuration buffer is too small. Please increase CacheSize parameter.");

                Comment

                • treelowa
                  Junior Member
                  • Apr 2010
                  • 6

                  #9
                  Thanks,

                  I am not exactly sure what I am supposed to change. I am not a developer, so any help would be appreciated.

                  Thanks

                  Comment

                  Working...