Don't like ads? PRO users don't see any ads ;-)
Guest

gmond.conf

By: a guest on Sep 2nd, 2011  |  syntax: None  |  size: 8.24 KB  |  hits: 37  |  expires: Never
download  |  raw  |  embed  |  report abuse  |  print
Text below is selected. Please press Ctrl+C to copy to your clipboard. (⌘+C on Mac)
  1. /* This configuration is as close to 2.5.x default behavior as possible.
  2.    The values closely match ./gmond/metric.h definitions in 2.5.x */
  3. globals {
  4.   daemonize = yes
  5.   setuid = yes
  6.   user = nobody
  7.   debug_level = 0
  8.   max_udp_msg_len = 1472
  9.   mute = no
  10.   deaf = no
  11.   allow_extra_data = yes
  12.   host_dmax = 3600 /*secs */
  13.   host_tmax = 20 /*secs */
  14.   cleanup_threshold = 300 /*secs */
  15.   gexec = no
  16.   send_metadata_interval = 0 /*secs */
  17. }
  18.  
  19. /*
  20.  * The cluster attributes specified will be used as part of the <CLUSTER>
  21.  * tag that will wrap all hosts collected by this instance.
  22.  */
  23. cluster {
  24.   name = "compute"
  25.   owner = "unspecified"
  26.   latlong = "unspecified"
  27.   url = "unspecified"
  28. }
  29.  
  30. /* The host section describes attributes of the host, like the location */
  31. host {
  32.   location = "unspecified"
  33. }
  34.  
  35. /* Feel free to specify as many udp_send_channels as you like.  Gmond
  36.    used to only support having a single channel */
  37. udp_send_channel {
  38.   #bind_hostname = yes # Highly recommended, soon to be default.
  39.                        # This option tells gmond to use a source address
  40.                        # that resolves to the machine's hostname.  Without
  41.                        # this, the metrics may appear to come from any
  42.                        # interface and the DNS names associated with
  43.                        # those IPs will be used to create the RRDs.
  44.   mcast_join = 239.2.11.73
  45.   port = 8649
  46.   ttl = 1
  47. }
  48.  
  49. udp_send_channel{
  50.   host = c1
  51.   port = 8649
  52. }
  53.  
  54. udp_send_channel{
  55.   host = c4
  56.   port = 8649
  57. }
  58.  
  59.  
  60. /* You can specify as many udp_recv_channels as you like as well. */
  61. udp_recv_channel {
  62.   mcast_join = 239.2.11.73
  63.   port = 8649
  64.   bind = 239.2.11.73
  65. }
  66.  
  67. /* You can specify as many tcp_accept_channels as you like to share
  68.    an xml description of the state of the cluster */
  69. tcp_accept_channel {
  70.   port = 8649
  71. }
  72.  
  73. /* Channel to receive sFlow datagrams */
  74. #udp_recv_channel {
  75. #  port = 6343
  76. #}
  77.  
  78. /* Optional sFlow settings */
  79. #sflow {
  80. # udp_port = 6343
  81. # accept_vm_metrics = no
  82. #}
  83.  
  84. /* Each metrics module that is referenced by gmond must be specified and
  85.    loaded. If the module has been statically linked with gmond, it does
  86.    not require a load path. However all dynamically loadable modules must
  87.    include a load path. */
  88. modules {
  89.   module {
  90.     name = "core_metrics"
  91.   }
  92.   module {
  93.     name = "cpu_module"
  94.     path = "modcpu.so"
  95.   }
  96.   module {
  97.     name = "disk_module"
  98.     path = "moddisk.so"
  99.   }
  100.   module {
  101.     name = "load_module"
  102.     path = "modload.so"
  103.   }
  104.   module {
  105.     name = "mem_module"
  106.     path = "modmem.so"
  107.   }
  108.   module {
  109.     name = "net_module"
  110.     path = "modnet.so"
  111.   }
  112.   module {
  113.     name = "proc_module"
  114.     path = "modproc.so"
  115.   }
  116.   module {
  117.     name = "sys_module"
  118.     path = "modsys.so"
  119.   }
  120. }
  121.  
  122. /* The old internal 2.5.x metric array has been replaced by the following
  123.    collection_group directives.  What follows is the default behavior for
  124.    collecting and sending metrics that is as close to 2.5.x behavior as
  125.    possible. */
  126.  
  127. /* This collection group will cause a heartbeat (or beacon) to be sent every
  128.    20 seconds.  In the heartbeat is the GMOND_STARTED data which expresses
  129.    the age of the running gmond. */
  130. collection_group {
  131.   collect_once = yes
  132.   time_threshold = 20
  133.   metric {
  134.     name = "heartbeat"
  135.   }
  136. }
  137.  
  138. /* This collection group will send general info about this host every
  139.    1200 secs.
  140.    This information doesn't change between reboots and is only collected
  141.    once. */
  142. collection_group {
  143.   collect_once = yes
  144.   time_threshold = 1200
  145.   metric {
  146.     name = "cpu_num"
  147.     title = "CPU Count"
  148.   }
  149.   metric {
  150.     name = "cpu_speed"
  151.     title = "CPU Speed"
  152.   }
  153.   metric {
  154.     name = "mem_total"
  155.     title = "Memory Total"
  156.   }
  157.   /* Should this be here? Swap can be added/removed between reboots. */
  158.   metric {
  159.     name = "swap_total"
  160.     title = "Swap Space Total"
  161.   }
  162.   metric {
  163.     name = "boottime"
  164.     title = "Last Boot Time"
  165.   }
  166.   metric {
  167.     name = "machine_type"
  168.     title = "Machine Type"
  169.   }
  170.   metric {
  171.     name = "os_name"
  172.     title = "Operating System"
  173.   }
  174.   metric {
  175.     name = "os_release"
  176.     title = "Operating System Release"
  177.   }
  178.   metric {
  179.     name = "location"
  180.     title = "Location"
  181.   }
  182. }
  183.  
  184. /* This collection group will send the status of gexecd for this host
  185.    every 300 secs.*/
  186. /* Unlike 2.5.x the default behavior is to report gexecd OFF. */
  187. collection_group {
  188.   collect_once = yes
  189.   time_threshold = 300
  190.   metric {
  191.     name = "gexec"
  192.     title = "Gexec Status"
  193.   }
  194. }
  195.  
  196. /* This collection group will collect the CPU status info every 20 secs.
  197.    The time threshold is set to 90 seconds.  In honesty, this
  198.    time_threshold could be set significantly higher to reduce
  199.    unnecessary network chatter. */
  200. collection_group {
  201.   collect_every = 20
  202.   time_threshold = 90
  203.   /* CPU status */
  204.   metric {
  205.     name = "cpu_user"
  206.     value_threshold = "1.0"
  207.     title = "CPU User"
  208.   }
  209.   metric {
  210.     name = "cpu_system"
  211.     value_threshold = "1.0"
  212.     title = "CPU System"
  213.   }
  214.   metric {
  215.     name = "cpu_idle"
  216.     value_threshold = "5.0"
  217.     title = "CPU Idle"
  218.   }
  219.   metric {
  220.     name = "cpu_nice"
  221.     value_threshold = "1.0"
  222.     title = "CPU Nice"
  223.   }
  224.   metric {
  225.     name = "cpu_aidle"
  226.     value_threshold = "5.0"
  227.     title = "CPU aidle"
  228.   }
  229.   metric {
  230.     name = "cpu_wio"
  231.     value_threshold = "1.0"
  232.     title = "CPU wio"
  233.   }
  234.   /* The next two metrics are optional: enable them only if you want more
  235.      detail, since they are already accounted for in cpu_system.
  236.   metric {
  237.     name = "cpu_intr"
  238.     value_threshold = "1.0"
  239.     title = "CPU intr"
  240.   }
  241.   metric {
  242.     name = "cpu_sintr"
  243.     value_threshold = "1.0"
  244.     title = "CPU sintr"
  245.   }
  246.   */
  247. }
  248.  
  249. collection_group {
  250.   collect_every = 20
  251.   time_threshold = 90
  252.   /* Load Averages */
  253.   metric {
  254.     name = "load_one"
  255.     value_threshold = "1.0"
  256.     title = "One Minute Load Average"
  257.   }
  258.   metric {
  259.     name = "load_five"
  260.     value_threshold = "1.0"
  261.     title = "Five Minute Load Average"
  262.   }
  263.   metric {
  264.     name = "load_fifteen"
  265.     value_threshold = "1.0"
  266.     title = "Fifteen Minute Load Average"
  267.   }
  268. }
  269.  
  270. /* This group collects the number of running and total processes */
  271. collection_group {
  272.   collect_every = 80
  273.   time_threshold = 950
  274.   metric {
  275.     name = "proc_run"
  276.     value_threshold = "1.0"
  277.     title = "Total Running Processes"
  278.   }
  279.   metric {
  280.     name = "proc_total"
  281.     value_threshold = "1.0"
  282.     title = "Total Processes"
  283.   }
  284. }
  285.  
  286. /* This collection group grabs the volatile memory metrics every 40 secs and
  287.    sends them at least every 180 secs.  This time_threshold can be increased
  288.    significantly to reduce unneeded network traffic. */
  289. collection_group {
  290.   collect_every = 40
  291.   time_threshold = 180
  292.   metric {
  293.     name = "mem_free"
  294.     value_threshold = "1024.0"
  295.     title = "Free Memory"
  296.   }
  297.   metric {
  298.     name = "mem_shared"
  299.     value_threshold = "1024.0"
  300.     title = "Shared Memory"
  301.   }
  302.   metric {
  303.     name = "mem_buffers"
  304.     value_threshold = "1024.0"
  305.     title = "Memory Buffers"
  306.   }
  307.   metric {
  308.     name = "mem_cached"
  309.     value_threshold = "1024.0"
  310.     title = "Cached Memory"
  311.   }
  312.   metric {
  313.     name = "swap_free"
  314.     value_threshold = "1024.0"
  315.     title = "Free Swap Space"
  316.   }
  317. }
  318.  
  319. collection_group {
  320.   collect_every = 40
  321.   time_threshold = 300
  322.   metric {
  323.     name = "bytes_out"
  324.     value_threshold = 4096
  325.     title = "Bytes Sent"
  326.   }
  327.   metric {
  328.     name = "bytes_in"
  329.     value_threshold = 4096
  330.     title = "Bytes Received"
  331.   }
  332.   metric {
  333.     name = "pkts_in"
  334.     value_threshold = 256
  335.     title = "Packets Received"
  336.   }
  337.   metric {
  338.     name = "pkts_out"
  339.     value_threshold = 256
  340.     title = "Packets Sent"
  341.   }
  342. }
  343.  
  344. /* Different than 2.5.x default since the old config made no sense */
  345. collection_group {
  346.   collect_every = 1800
  347.   time_threshold = 3600
  348.   metric {
  349.     name = "disk_total"
  350.     value_threshold = 1.0
  351.     title = "Total Disk Space"
  352.   }
  353. }
  354.  
  355. collection_group {
  356.   collect_every = 40
  357.   time_threshold = 180
  358.   metric {
  359.     name = "disk_free"
  360.     value_threshold = 1.0
  361.     title = "Disk Space Available"
  362.   }
  363.   metric {
  364.     name = "part_max_used"
  365.     value_threshold = 1.0
  366.     title = "Maximum Disk Space Used"
  367.   }
  368. }
  369.  
  370. include ("/etc/conf.d/*.conf")