2 * collectd - src/threshold.c
3 * Copyright (C) 2007-2010 Florian Forster
4 * Copyright (C) 2008-2009 Sebastian Harl
5 * Copyright (C) 2009 Andrés J. Díaz
6 * Copyright (C) 2014 Pierre-Yves Ritschard
8 * This program is free software; you can redistribute it and/or modify it
9 * under the terms of the GNU General Public License as published by the
10 * Free Software Foundation; only version 2 of the License is applicable.
12 * This program is distributed in the hope that it will be useful, but
13 * WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * General Public License for more details.
17 * You should have received a copy of the GNU General Public License along
18 * with this program; if not, write to the Free Software Foundation, Inc.,
19 * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
22 * Pierre-Yves Ritschard <pyr at spootnik.org>
23 * Florian octo Forster <octo at collectd.org>
24 * Sebastian Harl <sh at tokkee.org>
25 * Andrés J. Díaz <ajdiaz at connectical.com>
32 #include "utils_avltree.h"
33 #include "utils_cache.h"
34 #include "utils_threshold.h"
35 #include "write_riemann_threshold.h"
38 * Threshold management
39 * ====================
40 * The following functions add, delete, etc. configured thresholds to
41 * the underlying AVL trees.
45 * int ut_check_one_data_source
47 * Checks one data source against the given threshold configuration. If the
48 * `DataSource' option is set in the threshold, and the name does NOT match,
49 * `okay' is returned. If the threshold does match, its failure and warning
50 * min and max values are checked and `failure' or `warning' is returned if a limit is violated.
/*
 * Classifies the value of one data source against one threshold.
 *
 * Parameters:
 *   ds        data set description; ds->ds[ds_index].name is compared with
 *             th->data_source whenever that string is non-empty.
 *   vl        value list; forwarded to uc_get_state() in the hysteresis test.
 *   th        threshold providing failure/warning limits, hysteresis, flags.
 *   values    values to test; only values[ds_index] is read.
 *   ds_index  index of the data source inside ds and values.
 *
 * Returns a STATE_* code. Only the STATE_WARNING return is visible in this
 * view of the function; the other return paths are presumably
 * STATE_OKAY / STATE_ERROR as the leading description suggests - TODO
 * confirm against the complete source.
 *
 * NOTE(review): vl is tagged __attribute__((unused)) although it is passed
 * to uc_get_state() below; the attribute looks stale.
 */
54 static int ut_check_one_data_source(
55 const data_set_t *ds, const value_list_t __attribute__((unused)) * vl,
56 const threshold_t *th, const gauge_t *values, int ds_index) { /* {{{ */
60 int prev_state = STATE_OKAY;
62 /* check if this threshold applies to this data source */
64 ds_name = ds->ds[ds_index].name;
/* An empty th->data_source (first byte 0) matches every data source; a
 * non-empty one must equal the data source name exactly. */
65 if ((th->data_source[0] != 0) && (strcmp(ds_name, th->data_source) != 0))
/* UT_FLAG_INVERT handling: the statements guarded by this test are not
 * visible here - TODO confirm how the flag alters the result. */
69 if ((th->flags & UT_FLAG_INVERT) != 0) {
74 /* XXX: This is an experimental code, not optimized, not fast, not reliable,
75 * and probably, do not work as you expect. Enjoy! :D */
/* Hysteresis branch: entered only when a positive hysteresis is configured
 * and the state obtained from uc_get_state() is not STATE_OKAY. Each limit
 * is shifted by the hysteresis, so a test below is true only once the value
 * lies more than that margin above a minimum or below a maximum. Limits
 * that are NaN are skipped by the isnan() guards. */
76 if ((th->hysteresis > 0) &&
77 ((prev_state = uc_get_state(ds, vl)) != STATE_OKAY)) {
80 if ((!isnan(th->failure_min) &&
81 ((th->failure_min + th->hysteresis) < values[ds_index])) ||
82 (!isnan(th->failure_max) &&
83 ((th->failure_max - th->hysteresis) > values[ds_index])))
88 if ((!isnan(th->warning_min) &&
89 ((th->warning_min + th->hysteresis) < values[ds_index])) ||
90 (!isnan(th->warning_max) &&
91 ((th->warning_max - th->hysteresis) > values[ds_index])))
96 } else { /* no hysteresis */
/* Plain comparison: a value below a configured minimum or above a
 * configured maximum violates that limit; failure limits are tested before
 * warning limits. */
97 if ((!isnan(th->failure_min) && (th->failure_min > values[ds_index])) ||
98 (!isnan(th->failure_max) && (th->failure_max < values[ds_index])))
101 if ((!isnan(th->warning_min) && (th->warning_min > values[ds_index])) ||
102 (!isnan(th->warning_max) && (th->warning_max < values[ds_index])))
110 return STATE_WARNING;
113 } /* }}} int ut_check_one_data_source */
116 * int ut_check_one_threshold
118 * Checks all data sources of a value list against the given threshold, using
119 * the ut_check_one_data_source function above. Returns the worst status,
120 * which is `okay' if nothing has failed.
121 * Returns less than zero if the data set doesn't have any data sources.
/*
 * Runs ut_check_one_data_source() for every data source of ds and merges the
 * results into statuses.
 *
 * Parameters:
 *   ds, vl    data set and value list, forwarded unchanged to
 *             ut_check_one_data_source().
 *   th        threshold to evaluate; UT_FLAG_PERCENTAGE selects percentage
 *             mode.
 *   values    input values; ds->ds_num entries are read.
 *   statuses  in/out array indexed like values; an entry is only ever raised
 *             to a higher status value, never lowered.
 *
 * In percentage mode the check runs on a local copy in which each value is
 * replaced by 100.0 * value / sum. If no value is defined or the sum is
 * zero, every entry of the copy is set to NAN instead. The statements that
 * accumulate sum and num are not visible here; presumably they add up and
 * count the non-NaN values - TODO confirm.
 *
 * The return statements are not visible in this view either - TODO confirm
 * the return contract against the complete source.
 */
123 static int ut_check_one_threshold(const data_set_t *ds, const value_list_t *vl,
124 const threshold_t *th, const gauge_t *values,
125 int *statuses) { /* {{{ */
/* NOTE(review): variable-length array sized by ds->ds_num. A zero length is
 * undefined behavior in C, so ds->ds_num > 0 must hold here - confirm that a
 * guard precedes this declaration. */
128 gauge_t values_copy[ds->ds_num];
/* sizeof applied to a VLA is evaluated at run time, so this copies exactly
 * ds->ds_num values. */
130 memcpy(values_copy, values, sizeof(values_copy));
132 if ((th->flags & UT_FLAG_PERCENTAGE) != 0) {
/* With a single data source the share of the sum carries no information;
 * the message below tells the user so. */
136 if (ds->ds_num == 1) {
138 "ut_check_one_threshold: The %s type has only one data "
139 "source, but you have configured to check this as a percentage. "
140 "That doesn't make much sense, because the percentage will always "
145 /* Prepare `sum' and `num'. */
146 for (size_t i = 0; i < ds->ds_num; i++)
147 if (!isnan(values[i])) {
152 if ((num == 0) /* All data sources are undefined. */
153 || (sum == 0.0)) /* Sum is zero, cannot calculate percentage. */
155 for (size_t i = 0; i < ds->ds_num; i++)
156 values_copy[i] = NAN;
157 } else /* We can actually calculate the percentage. */
159 for (size_t i = 0; i < ds->ds_num; i++)
160 values_copy[i] = 100.0 * values[i] / sum;
162 } /* if (UT_FLAG_PERCENTAGE) */
164 for (size_t i = 0; i < ds->ds_num; i++) {
165 status = ut_check_one_data_source(ds, vl, th, values_copy, i);
/* Keep the highest status value seen so far for this data source. */
168 if (statuses[i] < status)
169 statuses[i] = status;
171 } /* for (ds->ds_num) */
174 } /* }}} int ut_check_one_threshold */
177 * int write_riemann_threshold_check (named ut_check_threshold in its log messages)
179 * Gets a list of matching thresholds and searches for the worst status by one
180 * of the thresholds. The highest status seen for each data source is stored in `statuses'.
182 * Returns zero on success and if no threshold has been configured. Returns
183 * less than zero on failure.
/*
 * Public entry point: evaluates the threshold(s) matching vl and writes one
 * status per value into statuses.
 *
 * Parameters:
 *   ds        data set description belonging to vl.
 *   vl        value list to check; vl->values_len must be greater than zero
 *             (enforced with assert()).
 *   statuses  output array with at least vl->values_len entries; it is
 *             zeroed first and then updated through ut_check_one_threshold().
 *
 * Steps visible here: a test for threshold_tree being NULL, a lookup with
 * threshold_search() while threshold_lock is held, a rate lookup with
 * uc_get_rate(), the call to ut_check_one_threshold(), and an ERROR()
 * message reporting a failure of that call. The return statements are not
 * visible in this view - TODO confirm the return contract.
 *
 * NOTE(review): threshold_lock is released as soon as threshold_search()
 * returns, so th is used afterwards without the lock held; the existing
 * comment in the body already questions whether the lock is needed.
 *
 * NOTE(review): ownership of the array returned by uc_get_rate() is not
 * visible here - confirm that it is released on every path.
 *
 * NOTE(review): the log messages still use the name ut_check_threshold.
 */
185 int write_riemann_threshold_check(const data_set_t *ds, const value_list_t *vl,
186 int *statuses) { /* {{{ */
191 assert(vl->values_len > 0);
192 memset(statuses, 0, vl->values_len * sizeof(*statuses));
194 if (threshold_tree == NULL)
197 /* Is this lock really necessary? So far, thresholds are only inserted at
199 pthread_mutex_lock(&threshold_lock);
200 th = threshold_search(vl);
201 pthread_mutex_unlock(&threshold_lock);
205 DEBUG("ut_check_threshold: Found matching threshold(s)");
207 values = uc_get_rate(ds, vl);
212 status = ut_check_one_threshold(ds, vl, th, values, statuses);
214 ERROR("ut_check_threshold: ut_check_one_threshold failed.");
225 } /* }}} int ut_check_threshold */