mirror of
https://github.com/netdata/netdata.git
synced 2025-04-06 06:25:32 +00:00

* rrdset - in progress * rrdset optimal constructor; rrdset conflict * rrdset final touches * re-organization of rrdset object members * prevent use-after-free * dictionary dfe supports also counting of iterations * rrddim managed by dictionary * rrd.h cleanup * DICTIONARY_ITEM now is referencing actual dictionary items in the code * removed rrdset linked list * Revert "removed rrdset linked list" This reverts commit 690d6a588b4b99619c2c5e10f84e8f868ae6def5. * removed rrdset linked list * added comments * Switch chart uuid to static allocation in rrdset Remove unused functions * rrdset_archive() and friends... * always create rrdfamily * enable ml_free_dimension * rrddim_foreach done with dfe * most custom rrddim loops replaced with rrddim_foreach * removed accesses to rrddim->dimensions * removed locks that are no longer needed * rrdsetvar is now managed by the dictionary * set rrdset is rrdsetvar, fixes https://github.com/netdata/netdata/pull/13646#issuecomment-1242574853 * conflict callback of rrdsetvar now properly checks if it has to reset the variable * dictionary registered callbacks accept as first parameter the DICTIONARY_ITEM * dictionary dfe now uses internal counter to report; avoided excess variables defined with dfe * dictionary walkthrough callbacks get dictionary acquired items * dictionary reference counters that can be dupped from zero * added advanced functions for get and del * rrdvar managed by dictionaries * thread safety for rrdsetvar * faster rrdvar initialization * rrdvar string lengths should match in all add, del, get functions * rrdvar internals hidden from the rest of the world * rrdvar is now acquired throughout netdata * hide the internal structures of rrdsetvar * rrdsetvar is now acquired through out netdata * rrddimvar managed by dictionary; rrddimvar linked list removed; rrddimvar structures hidden from the rest of netdata * better error handling * dont create variables if not initialized for health * dont create variables if not 
initialized for health again * rrdfamily is now managed by dictionaries; references of it are acquired dictionary items * type checking on acquired objects * rrdcalc renaming of functions * type checking for rrdfamily_acquired * rrdcalc managed by dictionaries * rrdcalc double free fix * host rrdvars is always needed * attempt to fix deadlock 1 * attempt to fix deadlock 2 * Remove unused variable * attempt to fix deadlock 3 * snprintfz * rrdcalc index in rrdset fix * Stop storing active charts and computing chart hashes * Remove store active chart function * Remove compute chart hash function * Remove sql_store_chart_hash function * Remove store_active_dimension function * dictionary delayed destruction * formatting and cleanup * zero dictionary base on rrdsetvar * added internal error to log delayed destructions of dictionaries * typo in rrddimvar * added debugging info to dictionary * debug info * fix for rrdcalc keys being empty * remove forgotten unlock * remove deadlock * Switch to metadata version 5 and drop chart_hash chart_hash_map chart_active dimension_active v_chart_hash * SQL cosmetic changes * do not busy wait while destroying a referenced dictionary * remove deadlock * code cleanup; re-organization; * fast cleanup and flushing of dictionaries * number formatting fixes * do not delete configured alerts when archiving a chart * rrddim obsolete linked list management outside dictionaries * removed duplicate contexts call * fix crash when rrdfamily is not initialized * dont keep rrddimvar referenced * properly cleanup rrdvar * removed some locks * Do not attempt to cleanup chart_hash / chart_hash_map * rrdcalctemplate managed by dictionary * register callbacks on the right dictionary * removed some more locks * rrdcalc secondary index replaced with linked-list; rrdcalc labels updates are now executed by health thread * when looking up for an alarm look using both chart id and chart name * host initialization a bit more modular * init rrdlabels on host 
update * preparation for dictionary views * improved comment * unused variables without internal checks * service threads isolation and worker info * more worker info in service thread * thread cancelability debugging with internal checks * strings data races addressed; fixes https://github.com/netdata/netdata/issues/13647 * dictionary modularization * Remove unused SQL statement definition * unit-tested thread safety of dictionaries; removed data race conditions on dictionaries and strings; dictionaries now can detect if the caller is holds a write lock and automatically all the calls become their unsafe versions; all direct calls to unsafe version is eliminated * remove worker_is_idle() from the exit of service functions, because we lose the lock time between loops * rewritten dictionary to have 2 separate locks, one for indexing and another for traversal * Update collectors/cgroups.plugin/sys_fs_cgroup.c Co-authored-by: Vladimir Kobal <vlad@prokk.net> * Update collectors/cgroups.plugin/sys_fs_cgroup.c Co-authored-by: Vladimir Kobal <vlad@prokk.net> * Update collectors/proc.plugin/proc_net_dev.c Co-authored-by: Vladimir Kobal <vlad@prokk.net> * fix memory leak in rrdset cache_dir * minor dictionary changes * dont use index locks in single threaded * obsolete dict option * rrddim options and flags separation; rrdset_done() optimization to keep array of reference pointers to rrddim; * fix jump on uninitialized value in dictionary; remove double free of cache_dir * addressed codacy findings * removed debugging code * use the private refcount on dictionaries * make dictionary item desctructors work on dictionary destruction; strictier control on dictionary API; proper cleanup sequence on rrddim; * more dictionary statistics * global statistics about dictionary operations, memory, items, callbacks * dictionary support for views - missing the public API * removed warning about unused parameter * chart and context name for cloud * chart and context name for cloud, again 
* dictionary statistics fixed; first implementation of dictionary views - not currently used * only the master can globally delete an item * context needs netdata prefix * fix context and chart it of spins * fix for host variables when health is not enabled * run garbage collector on item insert too * Fix info message; remove extra "using" * update dict unittest for new placement of garbage collector * we need RRDHOST->rrdvars for maintaining custom host variables * Health initialization needs the host->host_uuid * split STRING to its own files; no code changes other than that * initialize health unconditionally * unit tests do not pollute the global scope with their variables * Skip initialization when creating archived hosts on startup. When a child connects it will initialize properly Co-authored-by: Stelios Fragkakis <52996999+stelfrag@users.noreply.github.com> Co-authored-by: Vladimir Kobal <vlad@prokk.net>
258 lines
10 KiB
C
258 lines
10 KiB
C
// SPDX-License-Identifier: GPL-3.0-or-later
|
|
|
|
#include "rrd.h"
|
|
|
|
#ifndef NETDATA_RRDCALC_H
|
|
#define NETDATA_RRDCALC_H 1
|
|
|
|
// calculated variables (defined in health configuration)
|
|
// These aggregate time-series data at fixed intervals
|
|
// (defined in their update_every member below)
|
|
// They increase the overhead of netdata.
|
|
//
|
|
// These calculations are stored under RRDHOST.
|
|
// They are also linked to RRDSET (of course only when a
|
|
// matching chart is found).
|
|
|
|
// Bit flags describing the state of an alert.
// Every enumerator occupies its own bit, so values can be OR-ed together;
// struct rrdcalc keeps them in its run_flags member.
typedef enum {
    RRDCALC_FLAG_DB_ERROR      = (1 << 0),
    RRDCALC_FLAG_DB_NAN        = (1 << 1),
    // bit 2 is unassigned: the entry below is intentionally left commented out
    // RRDCALC_FLAG_DB_STALE   = (1 << 2),
    RRDCALC_FLAG_CALC_ERROR    = (1 << 3),
    RRDCALC_FLAG_WARN_ERROR    = (1 << 4),
    RRDCALC_FLAG_CRIT_ERROR    = (1 << 5),
    RRDCALC_FLAG_RUNNABLE      = (1 << 6),
    RRDCALC_FLAG_DISABLED      = (1 << 7),
    RRDCALC_FLAG_SILENCED      = (1 << 8),
    RRDCALC_FLAG_RUN_ONCE      = (1 << 9),
    RRDCALC_FLAG_FROM_TEMPLATE = (1 << 10), // the rrdcalc has been created from a template
} RRDCALC_FLAGS;
|
|
|
|
// Alert configuration options (see the `options` member of struct rrdcalc).
typedef enum {
    // This list uses several other options from RRDR_OPTIONS for db lookups.
    // To add an item here, you need to reserve a bit in RRDR_OPTIONS.
    //
    // NOTE(review): 0x80000000 does not fit in a signed 32-bit int, so this
    // enumerator depends on the compiler accepting enum values outside the
    // range of int - confirm this holds for every supported toolchain.
    RRDCALC_OPTION_NO_CLEAR_NOTIFICATION = 0x80000000,
} RRDCALC_OPTIONS;
|
|
|
|
// Mask of the option bits declared in RRDCALC_OPTIONS itself (as opposed to the
// ones borrowed from RRDR_OPTIONS); it currently expands to the single
// RRDCALC_OPTION_NO_CLEAR_NOTIFICATION bit.
#define RRDCALC_ALL_OPTIONS_EXCLUDING_THE_RRDR_ONES (RRDCALC_OPTION_NO_CLEAR_NOTIFICATION)
|
|
|
|
struct rrdcalc {
|
|
STRING *key; // the unique key in the host's rrdcalc_root_index
|
|
|
|
uint32_t id; // the unique id of this alarm
|
|
uint32_t next_event_id; // the next event id that will be used for this alarm
|
|
|
|
uuid_t config_hash_id; // a predictable hash_id based on specific alert configuration
|
|
|
|
STRING *name; // the name of this alarm
|
|
STRING *chart; // the chart id this should be linked to
|
|
|
|
STRING *exec; // the command to execute when this alarm switches state
|
|
STRING *recipient; // the recipient of the alarm (the first parameter to exec)
|
|
|
|
STRING *classification; // the class that this alarm belongs
|
|
STRING *component; // the component that this alarm refers to
|
|
STRING *type; // type of the alarm
|
|
|
|
STRING *plugin_match; // the plugin name that should be linked to
|
|
SIMPLE_PATTERN *plugin_pattern;
|
|
|
|
STRING *module_match; // the module name that should be linked to
|
|
SIMPLE_PATTERN *module_pattern;
|
|
|
|
STRING *source; // the source of this alarm
|
|
STRING *units; // the units of the alarm
|
|
STRING *original_info; // the original info field before any variable replacement
|
|
STRING *info; // a short description of the alarm
|
|
|
|
int update_every; // update frequency for the alarm
|
|
|
|
// the red and green threshold of this alarm (to be set to the chart)
|
|
NETDATA_DOUBLE green;
|
|
NETDATA_DOUBLE red;
|
|
|
|
// ------------------------------------------------------------------------
|
|
// database lookup settings
|
|
|
|
STRING *dimensions; // the chart dimensions
|
|
STRING *foreach_dimension; // the group of dimensions that the `foreach` will be applied.
|
|
SIMPLE_PATTERN *foreach_dimension_pattern; // used if and only if there is a simple pattern for the chart.
|
|
RRDR_GROUPING group; // grouping method: average, max, etc.
|
|
int before; // ending point in time-series
|
|
int after; // starting point in time-series
|
|
RRDCALC_OPTIONS options; // configuration options
|
|
|
|
// ------------------------------------------------------------------------
|
|
// expressions related to the alarm
|
|
|
|
EVAL_EXPRESSION *calculation; // expression to calculate the value of the alarm
|
|
EVAL_EXPRESSION *warning; // expression to check the warning condition
|
|
EVAL_EXPRESSION *critical; // expression to check the critical condition
|
|
|
|
// ------------------------------------------------------------------------
|
|
// notification delay settings
|
|
|
|
int delay_up_duration; // duration to delay notifications when alarm raises
|
|
int delay_down_duration; // duration to delay notifications when alarm lowers
|
|
int delay_max_duration; // the absolute max delay to apply to this alarm
|
|
float delay_multiplier; // multiplier for all delays when alarms switch status
|
|
// while now < delay_up_to
|
|
|
|
// ------------------------------------------------------------------------
|
|
// notification repeat settings
|
|
|
|
uint32_t warn_repeat_every; // interval between repeating warning notifications
|
|
uint32_t crit_repeat_every; // interval between repeating critical notifications
|
|
|
|
// ------------------------------------------------------------------------
|
|
// Labels settings
|
|
STRING *host_labels; // the label read from an alarm file
|
|
SIMPLE_PATTERN *host_labels_pattern; // the simple pattern of labels
|
|
|
|
// ------------------------------------------------------------------------
|
|
// runtime information
|
|
|
|
RRDCALC_STATUS old_status; // the old status of the alarm
|
|
RRDCALC_STATUS status; // the current status of the alarm
|
|
|
|
NETDATA_DOUBLE value; // the current value of the alarm
|
|
NETDATA_DOUBLE old_value; // the previous value of the alarm
|
|
|
|
RRDCALC_FLAGS run_flags; // check RRDCALC_FLAG_*
|
|
|
|
time_t last_updated; // the last update timestamp of the alarm
|
|
time_t next_update; // the next update timestamp of the alarm
|
|
time_t last_status_change; // the timestamp of the last time this alarm changed status
|
|
time_t last_repeat; // the last time the alarm got repeated
|
|
uint32_t times_repeat; // number of times the alarm got repeated
|
|
|
|
time_t db_after; // the first timestamp evaluated by the db lookup
|
|
time_t db_before; // the last timestamp evaluated by the db lookup
|
|
|
|
time_t delay_up_to_timestamp; // the timestamp up to which we should delay notifications
|
|
int delay_up_current; // the current up notification delay duration
|
|
int delay_down_current; // the current down notification delay duration
|
|
int delay_last; // the last delay we used
|
|
|
|
// ------------------------------------------------------------------------
|
|
// variables this alarm exposes to the rest of the alarms
|
|
|
|
const RRDVAR_ACQUIRED *rrdvar_local;
|
|
const RRDVAR_ACQUIRED *rrdvar_family;
|
|
const RRDVAR_ACQUIRED *rrdvar_host_chart_id;
|
|
const RRDVAR_ACQUIRED *rrdvar_host_chart_name;
|
|
|
|
// ------------------------------------------------------------------------
|
|
// the chart this alarm it is linked to
|
|
|
|
size_t labels_version;
|
|
struct rrdset *rrdset;
|
|
|
|
struct rrdcalc *next;
|
|
struct rrdcalc *prev;
|
|
};
|
|
|
|
// Convenience accessors: each one hands the named STRING member of an RRDCALC
// to string2str(). `rc` is evaluated exactly once per use.
// Note that rrdcalc_chart_name() reads the `chart` member, which the struct
// documents as the chart id the alert should be linked to.
#define rrdcalc_name(rc)            string2str((rc)->name)
#define rrdcalc_chart_name(rc)      string2str((rc)->chart)
#define rrdcalc_exec(rc)            string2str((rc)->exec)
#define rrdcalc_recipient(rc)       string2str((rc)->recipient)
#define rrdcalc_classification(rc)  string2str((rc)->classification)
#define rrdcalc_component(rc)       string2str((rc)->component)
#define rrdcalc_type(rc)            string2str((rc)->type)
#define rrdcalc_plugin_match(rc)    string2str((rc)->plugin_match)
#define rrdcalc_module_match(rc)    string2str((rc)->module_match)
#define rrdcalc_source(rc)          string2str((rc)->source)
#define rrdcalc_units(rc)           string2str((rc)->units)
#define rrdcalc_original_info(rc)   string2str((rc)->original_info)
#define rrdcalc_info(rc)            string2str((rc)->info)
#define rrdcalc_dimensions(rc)      string2str((rc)->dimensions)
#define rrdcalc_foreachdim(rc)      string2str((rc)->foreach_dimension)
#define rrdcalc_host_labels(rc)     string2str((rc)->host_labels)
|
|
|
|
// Iteration helpers over the alerts indexed in a host's rrdcalc_root_index.
//
// foreach_rrdcalc_in_rrdhost_read(host, rc)      expands to dfe_start_read()
// foreach_rrdcalc_in_rrdhost_reentrant(host, rc) expands to dfe_start_reentrant()
// foreach_rrdcalc_in_rrdhost_done(rc)            expands to dfe_done()
//
// `host` must be a pointer to an object with a rrdcalc_root_index member and
// `rc` is the name handed to the dfe_*() macros as the iteration item.
// NOTE(review): each start macro is presumably paired with a matching
// foreach_rrdcalc_in_rrdhost_done(rc) - confirm against the dfe_*() definitions.
//
// The replacement lists must not end with a line-continuation backslash:
// otherwise the line following the macro is silently absorbed into it.
#define foreach_rrdcalc_in_rrdhost_read(host, rc) \
    dfe_start_read((host)->rrdcalc_root_index, rc)

#define foreach_rrdcalc_in_rrdhost_reentrant(host, rc) \
    dfe_start_reentrant((host)->rrdcalc_root_index, rc)

#define foreach_rrdcalc_in_rrdhost_done(rc) \
    dfe_done(rc)
|
|
|
|
struct alert_config {
|
|
STRING *alarm;
|
|
STRING *template_key;
|
|
STRING *os;
|
|
STRING *host;
|
|
STRING *on;
|
|
STRING *families;
|
|
STRING *plugin;
|
|
STRING *module;
|
|
STRING *charts;
|
|
STRING *lookup;
|
|
STRING *calc;
|
|
STRING *warn;
|
|
STRING *crit;
|
|
STRING *every;
|
|
STRING *green;
|
|
STRING *red;
|
|
STRING *exec;
|
|
STRING *to;
|
|
STRING *units;
|
|
STRING *info;
|
|
STRING *classification;
|
|
STRING *component;
|
|
STRING *type;
|
|
STRING *delay;
|
|
STRING *options;
|
|
STRING *repeat;
|
|
STRING *host_labels;
|
|
|
|
STRING *p_db_lookup_dimensions;
|
|
STRING *p_db_lookup_method;
|
|
|
|
uint32_t p_db_lookup_options;
|
|
int32_t p_db_lookup_after;
|
|
int32_t p_db_lookup_before;
|
|
int32_t p_update_every;
|
|
};
|
|
|
|
// Evaluates to the alert's `after` member (the starting point of its
// time-series lookup), so it is non-zero exactly when `after` is non-zero.
#define RRDCALC_HAS_DB_LOOKUP(rc) ((rc)->after)
|
|
|
|
extern void rrdcalc_update_info_using_rrdset_labels(RRDCALC *rc);
|
|
|
|
extern void rrdcalc_link_matching_alerts_to_rrdset(RRDSET *st);
|
|
|
|
extern const RRDCALC_ACQUIRED *rrdcalc_from_rrdset_get(RRDSET *st, const char *alert_name);
|
|
extern void rrdcalc_from_rrdset_release(RRDSET *st, const RRDCALC_ACQUIRED *rca);
|
|
extern RRDCALC *rrdcalc_acquired_to_rrdcalc(const RRDCALC_ACQUIRED *rca);
|
|
|
|
extern const char *rrdcalc_status2string(RRDCALC_STATUS status);
|
|
|
|
extern void rrdcalc_free_unused_rrdcalc_loaded_from_config(RRDCALC *rc);
|
|
|
|
extern uint32_t rrdcalc_get_unique_id(RRDHOST *host, STRING *chart, STRING *name, uint32_t *next_event_id);
|
|
extern void rrdcalc_add_from_rrdcalctemplate(RRDHOST *host, RRDCALCTEMPLATE *rt, RRDSET *st, const char *overwrite_alert_name, const char *overwrite_dimensions);
|
|
extern int rrdcalc_add_from_config(RRDHOST *host, RRDCALC *rc);
|
|
|
|
extern void rrdcalc_delete_alerts_not_matching_host_labels_from_all_hosts();
|
|
extern void rrdcalc_delete_alerts_not_matching_host_labels_from_this_host(RRDHOST *host);
|
|
|
|
// Tell whether an alert has repeating notifications configured.
//
// @param rc  the alert to inspect; it is dereferenced, so it must not be NULL
// @return    1 when warn_repeat_every or crit_repeat_every is greater than
//            zero, 0 otherwise
static inline int rrdcalc_isrepeating(RRDCALC *rc) {
    // the check is wrapped in unlikely(), i.e. repeating alerts are treated
    // as the uncommon case
    if (unlikely(rc->warn_repeat_every > 0 || rc->crit_repeat_every > 0)) {
        return 1;
    }

    return 0;
}
|
|
|
|
extern void rrdcalc_unlink_all_rrdset_alerts(RRDSET *st);
|
|
extern void rrdcalc_delete_all(RRDHOST *host);
|
|
|
|
extern void rrdcalc_rrdhost_index_init(RRDHOST *host);
|
|
extern void rrdcalc_rrdhost_index_destroy(RRDHOST *host);
|
|
|
|
// Constants for the "$..." placeholders recognised in alert text.
// NOTE(review): RRDCALC_VAR_MAX is presumably an upper bound on the length of
// such a placeholder - confirm at the point of use.
#define RRDCALC_VAR_MAX 100
#define RRDCALC_VAR_FAMILY "$family"
#define RRDCALC_VAR_LABEL "$label:"
// length of RRDCALC_VAR_LABEL without its terminating NUL
#define RRDCALC_VAR_LABEL_LEN (sizeof(RRDCALC_VAR_LABEL)-1)
|
|
|
|
#endif //NETDATA_RRDCALC_H
|