mirror of
https://github.com/netdata/netdata.git
synced 2025-04-14 09:38:34 +00:00

* rrdset - in progress * rrdset optimal constructor; rrdset conflict * rrdset final touches * re-organization of rrdset object members * prevent use-after-free * dictionary dfe supports also counting of iterations * rrddim managed by dictionary * rrd.h cleanup * DICTIONARY_ITEM now is referencing actual dictionary items in the code * removed rrdset linked list * Revert "removed rrdset linked list" This reverts commit 690d6a588b4b99619c2c5e10f84e8f868ae6def5. * removed rrdset linked list * added comments * Switch chart uuid to static allocation in rrdset Remove unused functions * rrdset_archive() and friends... * always create rrdfamily * enable ml_free_dimension * rrddim_foreach done with dfe * most custom rrddim loops replaced with rrddim_foreach * removed accesses to rrddim->dimensions * removed locks that are no longer needed * rrdsetvar is now managed by the dictionary * set rrdset is rrdsetvar, fixes https://github.com/netdata/netdata/pull/13646#issuecomment-1242574853 * conflict callback of rrdsetvar now properly checks if it has to reset the variable * dictionary registered callbacks accept as first parameter the DICTIONARY_ITEM * dictionary dfe now uses internal counter to report; avoided excess variables defined with dfe * dictionary walkthrough callbacks get dictionary acquired items * dictionary reference counters that can be dupped from zero * added advanced functions for get and del * rrdvar managed by dictionaries * thread safety for rrdsetvar * faster rrdvar initialization * rrdvar string lengths should match in all add, del, get functions * rrdvar internals hidden from the rest of the world * rrdvar is now acquired throughout netdata * hide the internal structures of rrdsetvar * rrdsetvar is now acquired through out netdata * rrddimvar managed by dictionary; rrddimvar linked list removed; rrddimvar structures hidden from the rest of netdata * better error handling * dont create variables if not initialized for health * dont create variables if not initialized for health again * rrdfamily is now managed by dictionaries; references of it are acquired dictionary items * type checking on acquired objects * rrdcalc renaming of functions * type checking for rrdfamily_acquired * rrdcalc managed by dictionaries * rrdcalc double free fix * host rrdvars is always needed * attempt to fix deadlock 1 * attempt to fix deadlock 2 * Remove unused variable * attempt to fix deadlock 3 * snprintfz * rrdcalc index in rrdset fix * Stop storing active charts and computing chart hashes * Remove store active chart function * Remove compute chart hash function * Remove sql_store_chart_hash function * Remove store_active_dimension function * dictionary delayed destruction * formatting and cleanup * zero dictionary base on rrdsetvar * added internal error to log delayed destructions of dictionaries * typo in rrddimvar * added debugging info to dictionary * debug info * fix for rrdcalc keys being empty * remove forgotten unlock * remove deadlock * Switch to metadata version 5 and drop chart_hash chart_hash_map chart_active dimension_active v_chart_hash * SQL cosmetic changes * do not busy wait while destroying a referenced dictionary * remove deadlock * code cleanup; re-organization; * fast cleanup and flushing of dictionaries * number formatting fixes * do not delete configured alerts when archiving a chart * rrddim obsolete linked list management outside dictionaries * removed duplicate contexts call * fix crash when rrdfamily is not initialized * dont keep rrddimvar referenced * properly cleanup rrdvar * removed some locks * Do not attempt to cleanup chart_hash / chart_hash_map * rrdcalctemplate managed by dictionary * register callbacks on the right dictionary * removed some more locks * rrdcalc secondary index replaced with linked-list; rrdcalc labels updates are now executed by health thread * when looking up for an alarm look using both chart id and chart name * host initialization a bit more modular * init rrdlabels on host update * preparation for dictionary views * improved comment * unused variables without internal checks * service threads isolation and worker info * more worker info in service thread * thread cancelability debugging with internal checks * strings data races addressed; fixes https://github.com/netdata/netdata/issues/13647 * dictionary modularization * Remove unused SQL statement definition * unit-tested thread safety of dictionaries; removed data race conditions on dictionaries and strings; dictionaries now can detect if the caller is holds a write lock and automatically all the calls become their unsafe versions; all direct calls to unsafe version is eliminated * remove worker_is_idle() from the exit of service functions, because we lose the lock time between loops * rewritten dictionary to have 2 separate locks, one for indexing and another for traversal * Update collectors/cgroups.plugin/sys_fs_cgroup.c Co-authored-by: Vladimir Kobal <vlad@prokk.net> * Update collectors/cgroups.plugin/sys_fs_cgroup.c Co-authored-by: Vladimir Kobal <vlad@prokk.net> * Update collectors/proc.plugin/proc_net_dev.c Co-authored-by: Vladimir Kobal <vlad@prokk.net> * fix memory leak in rrdset cache_dir * minor dictionary changes * dont use index locks in single threaded * obsolete dict option * rrddim options and flags separation; rrdset_done() optimization to keep array of reference pointers to rrddim; * fix jump on uninitialized value in dictionary; remove double free of cache_dir * addressed codacy findings * removed debugging code * use the private refcount on dictionaries * make dictionary item desctructors work on dictionary destruction; strictier control on dictionary API; proper cleanup sequence on rrddim; * more dictionary statistics * global statistics about dictionary operations, memory, items, callbacks * dictionary support for views - missing the public API * removed warning about unused parameter * chart and context name for cloud * chart and context name for cloud, again * dictionary statistics fixed; first implementation of dictionary views - not currently used * only the master can globally delete an item * context needs netdata prefix * fix context and chart it of spins * fix for host variables when health is not enabled * run garbage collector on item insert too * Fix info message; remove extra "using" * update dict unittest for new placement of garbage collector * we need RRDHOST->rrdvars for maintaining custom host variables * Health initialization needs the host->host_uuid * split STRING to its own files; no code changes other than that * initialize health unconditionally * unit tests do not pollute the global scope with their variables * Skip initialization when creating archived hosts on startup. When a child connects it will initialize properly Co-authored-by: Stelios Fragkakis <52996999+stelfrag@users.noreply.github.com> Co-authored-by: Vladimir Kobal <vlad@prokk.net>
439 lines
17 KiB
C
439 lines
17 KiB
C
// SPDX-License-Identifier: GPL-3.0-or-later
|
|
|
|
#include "health.h"
|
|
|
|
void health_string2json(BUFFER *wb, const char *prefix, const char *label, const char *value, const char *suffix) {
|
|
if(value && *value) {
|
|
buffer_sprintf(wb, "%s\"%s\":\"", prefix, label);
|
|
buffer_strcat_htmlescape(wb, value);
|
|
buffer_strcat(wb, "\"");
|
|
buffer_strcat(wb, suffix);
|
|
}
|
|
else
|
|
buffer_sprintf(wb, "%s\"%s\":null%s", prefix, label, suffix);
|
|
}
|
|
|
|
void health_alarm_entry2json_nolock(BUFFER *wb, ALARM_ENTRY *ae, RRDHOST *host) {
|
|
char *edit_command = ae->source ? health_edit_command_from_source(ae_source(ae)) : strdupz("UNKNOWN=0=UNKNOWN");
|
|
char config_hash_id[GUID_LEN + 1];
|
|
uuid_unparse_lower(ae->config_hash_id, config_hash_id);
|
|
|
|
buffer_sprintf(wb,
|
|
"\n\t{\n"
|
|
"\t\t\"hostname\": \"%s\",\n"
|
|
"\t\t\"utc_offset\": %d,\n"
|
|
"\t\t\"timezone\": \"%s\",\n"
|
|
"\t\t\"unique_id\": %u,\n"
|
|
"\t\t\"alarm_id\": %u,\n"
|
|
"\t\t\"alarm_event_id\": %u,\n"
|
|
"\t\t\"config_hash_id\": \"%s\",\n"
|
|
"\t\t\"name\": \"%s\",\n"
|
|
"\t\t\"chart\": \"%s\",\n"
|
|
"\t\t\"context\": \"%s\",\n"
|
|
"\t\t\"family\": \"%s\",\n"
|
|
"\t\t\"class\": \"%s\",\n"
|
|
"\t\t\"component\": \"%s\",\n"
|
|
"\t\t\"type\": \"%s\",\n"
|
|
"\t\t\"processed\": %s,\n"
|
|
"\t\t\"updated\": %s,\n"
|
|
"\t\t\"exec_run\": %lu,\n"
|
|
"\t\t\"exec_failed\": %s,\n"
|
|
"\t\t\"exec\": \"%s\",\n"
|
|
"\t\t\"recipient\": \"%s\",\n"
|
|
"\t\t\"exec_code\": %d,\n"
|
|
"\t\t\"source\": \"%s\",\n"
|
|
"\t\t\"command\": \"%s\",\n"
|
|
"\t\t\"units\": \"%s\",\n"
|
|
"\t\t\"when\": %lu,\n"
|
|
"\t\t\"duration\": %lu,\n"
|
|
"\t\t\"non_clear_duration\": %lu,\n"
|
|
"\t\t\"status\": \"%s\",\n"
|
|
"\t\t\"old_status\": \"%s\",\n"
|
|
"\t\t\"delay\": %d,\n"
|
|
"\t\t\"delay_up_to_timestamp\": %lu,\n"
|
|
"\t\t\"updated_by_id\": %u,\n"
|
|
"\t\t\"updates_id\": %u,\n"
|
|
"\t\t\"value_string\": \"%s\",\n"
|
|
"\t\t\"old_value_string\": \"%s\",\n"
|
|
"\t\t\"last_repeat\": \"%lu\",\n"
|
|
"\t\t\"silenced\": \"%s\",\n"
|
|
, rrdhost_hostname(host)
|
|
, host->utc_offset
|
|
, rrdhost_abbrev_timezone(host)
|
|
, ae->unique_id
|
|
, ae->alarm_id
|
|
, ae->alarm_event_id
|
|
, config_hash_id
|
|
, ae_name(ae)
|
|
, ae_chart_name(ae)
|
|
, ae_chart_context(ae)
|
|
, ae_family(ae)
|
|
, ae->classification?ae_classification(ae):"Unknown"
|
|
, ae->component?ae_component(ae):"Unknown"
|
|
, ae->type?ae_type(ae):"Unknown"
|
|
, (ae->flags & HEALTH_ENTRY_FLAG_PROCESSED)?"true":"false"
|
|
, (ae->flags & HEALTH_ENTRY_FLAG_UPDATED)?"true":"false"
|
|
, (unsigned long)ae->exec_run_timestamp
|
|
, (ae->flags & HEALTH_ENTRY_FLAG_EXEC_FAILED)?"true":"false"
|
|
, ae->exec?ae_exec(ae):string2str(host->health_default_exec)
|
|
, ae->recipient?ae_recipient(ae):string2str(host->health_default_recipient)
|
|
, ae->exec_code
|
|
, ae_source(ae)
|
|
, edit_command
|
|
, ae_units(ae)
|
|
, (unsigned long)ae->when
|
|
, (unsigned long)ae->duration
|
|
, (unsigned long)ae->non_clear_duration
|
|
, rrdcalc_status2string(ae->new_status)
|
|
, rrdcalc_status2string(ae->old_status)
|
|
, ae->delay
|
|
, (unsigned long)ae->delay_up_to_timestamp
|
|
, ae->updated_by_id
|
|
, ae->updates_id
|
|
, ae_new_value_string(ae)
|
|
, ae_old_value_string(ae)
|
|
, (unsigned long)ae->last_repeat
|
|
, (ae->flags & HEALTH_ENTRY_FLAG_SILENCED)?"true":"false"
|
|
);
|
|
|
|
health_string2json(wb, "\t\t", "info", ae->info ? ae_info(ae) : "", ",\n");
|
|
|
|
if(unlikely(ae->flags & HEALTH_ENTRY_FLAG_NO_CLEAR_NOTIFICATION)) {
|
|
buffer_strcat(wb, "\t\t\"no_clear_notification\": true,\n");
|
|
}
|
|
|
|
buffer_strcat(wb, "\t\t\"value\":");
|
|
buffer_rrd_value(wb, ae->new_value);
|
|
buffer_strcat(wb, ",\n");
|
|
|
|
buffer_strcat(wb, "\t\t\"old_value\":");
|
|
buffer_rrd_value(wb, ae->old_value);
|
|
buffer_strcat(wb, "\n");
|
|
|
|
buffer_strcat(wb, "\t}");
|
|
|
|
freez(edit_command);
|
|
}
|
|
|
|
void health_alarm_log2json(RRDHOST *host, BUFFER *wb, uint32_t after, char *chart) {
|
|
|
|
buffer_strcat(wb, "[");
|
|
|
|
unsigned int max = host->health_log.max;
|
|
unsigned int count = 0;
|
|
|
|
STRING *chart_string = string_strdupz(chart);
|
|
|
|
netdata_rwlock_rdlock(&host->health_log.alarm_log_rwlock);
|
|
|
|
ALARM_ENTRY *ae;
|
|
for (ae = host->health_log.alarms; ae && count < max; ae = ae->next) {
|
|
if ((ae->unique_id > after) && (!chart || chart_string == ae->chart)) {
|
|
if (likely(count))
|
|
buffer_strcat(wb, ",");
|
|
health_alarm_entry2json_nolock(wb, ae, host);
|
|
count++;
|
|
}
|
|
}
|
|
|
|
netdata_rwlock_unlock(&host->health_log.alarm_log_rwlock);
|
|
|
|
string_freez(chart_string);
|
|
|
|
buffer_strcat(wb, "\n]\n");
|
|
}
|
|
|
|
static inline void health_rrdcalc_values2json_nolock(RRDHOST *host, BUFFER *wb, RRDCALC *rc) {
|
|
(void)host;
|
|
buffer_sprintf(wb,
|
|
"\t\t\"%s.%s\": {\n"
|
|
"\t\t\t\"id\": %lu,\n"
|
|
, rrdcalc_chart_name(rc), rrdcalc_name(rc)
|
|
, (unsigned long)rc->id);
|
|
|
|
buffer_strcat(wb, "\t\t\t\"value\":");
|
|
buffer_rrd_value(wb, rc->value);
|
|
buffer_strcat(wb, ",\n");
|
|
|
|
buffer_strcat(wb, "\t\t\t\"last_updated\":");
|
|
buffer_sprintf(wb, "%lu", (unsigned long)rc->last_updated);
|
|
buffer_strcat(wb, ",\n");
|
|
|
|
buffer_sprintf(wb,
|
|
"\t\t\t\"status\": \"%s\"\n"
|
|
, rrdcalc_status2string(rc->status));
|
|
|
|
buffer_strcat(wb, "\t\t}");
|
|
}
|
|
|
|
static inline void health_rrdcalc2json_nolock(RRDHOST *host, BUFFER *wb, RRDCALC *rc) {
|
|
char value_string[100 + 1];
|
|
format_value_and_unit(value_string, 100, rc->value, rrdcalc_units(rc), -1);
|
|
|
|
char hash_id[GUID_LEN + 1];
|
|
uuid_unparse_lower(rc->config_hash_id, hash_id);
|
|
|
|
buffer_sprintf(wb,
|
|
"\t\t\"%s.%s\": {\n"
|
|
"\t\t\t\"id\": %lu,\n"
|
|
"\t\t\t\"config_hash_id\": \"%s\",\n"
|
|
"\t\t\t\"name\": \"%s\",\n"
|
|
"\t\t\t\"chart\": \"%s\",\n"
|
|
"\t\t\t\"family\": \"%s\",\n"
|
|
"\t\t\t\"class\": \"%s\",\n"
|
|
"\t\t\t\"component\": \"%s\",\n"
|
|
"\t\t\t\"type\": \"%s\",\n"
|
|
"\t\t\t\"active\": %s,\n"
|
|
"\t\t\t\"disabled\": %s,\n"
|
|
"\t\t\t\"silenced\": %s,\n"
|
|
"\t\t\t\"exec\": \"%s\",\n"
|
|
"\t\t\t\"recipient\": \"%s\",\n"
|
|
"\t\t\t\"source\": \"%s\",\n"
|
|
"\t\t\t\"units\": \"%s\",\n"
|
|
"\t\t\t\"info\": \"%s\",\n"
|
|
"\t\t\t\"status\": \"%s\",\n"
|
|
"\t\t\t\"last_status_change\": %lu,\n"
|
|
"\t\t\t\"last_updated\": %lu,\n"
|
|
"\t\t\t\"next_update\": %lu,\n"
|
|
"\t\t\t\"update_every\": %d,\n"
|
|
"\t\t\t\"delay_up_duration\": %d,\n"
|
|
"\t\t\t\"delay_down_duration\": %d,\n"
|
|
"\t\t\t\"delay_max_duration\": %d,\n"
|
|
"\t\t\t\"delay_multiplier\": %f,\n"
|
|
"\t\t\t\"delay\": %d,\n"
|
|
"\t\t\t\"delay_up_to_timestamp\": %lu,\n"
|
|
"\t\t\t\"warn_repeat_every\": \"%u\",\n"
|
|
"\t\t\t\"crit_repeat_every\": \"%u\",\n"
|
|
"\t\t\t\"value_string\": \"%s\",\n"
|
|
"\t\t\t\"last_repeat\": \"%lu\",\n"
|
|
"\t\t\t\"times_repeat\": %lu,\n"
|
|
, rrdcalc_chart_name(rc), rrdcalc_name(rc)
|
|
, (unsigned long)rc->id
|
|
, hash_id
|
|
, rrdcalc_name(rc)
|
|
, rrdcalc_chart_name(rc)
|
|
, (rc->rrdset)?rrdset_family(rc->rrdset):""
|
|
, rc->classification?rrdcalc_classification(rc):"Unknown"
|
|
, rc->component?rrdcalc_component(rc):"Unknown"
|
|
, rc->type?rrdcalc_type(rc):"Unknown"
|
|
, (rc->rrdset)?"true":"false"
|
|
, (rc->run_flags & RRDCALC_FLAG_DISABLED)?"true":"false"
|
|
, (rc->run_flags & RRDCALC_FLAG_SILENCED)?"true":"false"
|
|
, rc->exec?rrdcalc_exec(rc):string2str(host->health_default_exec)
|
|
, rc->recipient?rrdcalc_recipient(rc):string2str(host->health_default_recipient)
|
|
, rrdcalc_source(rc)
|
|
, rrdcalc_units(rc)
|
|
, rrdcalc_info(rc)
|
|
, rrdcalc_status2string(rc->status)
|
|
, (unsigned long)rc->last_status_change
|
|
, (unsigned long)rc->last_updated
|
|
, (unsigned long)rc->next_update
|
|
, rc->update_every
|
|
, rc->delay_up_duration
|
|
, rc->delay_down_duration
|
|
, rc->delay_max_duration
|
|
, rc->delay_multiplier
|
|
, rc->delay_last
|
|
, (unsigned long)rc->delay_up_to_timestamp
|
|
, rc->warn_repeat_every
|
|
, rc->crit_repeat_every
|
|
, value_string
|
|
, (unsigned long)rc->last_repeat
|
|
, (unsigned long)rc->times_repeat
|
|
);
|
|
|
|
if(unlikely(rc->options & RRDCALC_OPTION_NO_CLEAR_NOTIFICATION)) {
|
|
buffer_strcat(wb, "\t\t\t\"no_clear_notification\": true,\n");
|
|
}
|
|
|
|
if(RRDCALC_HAS_DB_LOOKUP(rc)) {
|
|
if(rc->dimensions)
|
|
health_string2json(wb, "\t\t\t", "lookup_dimensions", rrdcalc_dimensions(rc), ",\n");
|
|
|
|
buffer_sprintf(wb,
|
|
"\t\t\t\"db_after\": %lu,\n"
|
|
"\t\t\t\"db_before\": %lu,\n"
|
|
"\t\t\t\"lookup_method\": \"%s\",\n"
|
|
"\t\t\t\"lookup_after\": %d,\n"
|
|
"\t\t\t\"lookup_before\": %d,\n"
|
|
"\t\t\t\"lookup_options\": \"",
|
|
(unsigned long) rc->db_after,
|
|
(unsigned long) rc->db_before,
|
|
group_method2string(rc->group),
|
|
rc->after,
|
|
rc->before
|
|
);
|
|
buffer_data_options2string(wb, rc->options);
|
|
buffer_strcat(wb, "\",\n");
|
|
}
|
|
|
|
if(rc->calculation) {
|
|
health_string2json(wb, "\t\t\t", "calc", rc->calculation->source, ",\n");
|
|
health_string2json(wb, "\t\t\t", "calc_parsed", rc->calculation->parsed_as, ",\n");
|
|
}
|
|
|
|
if(rc->warning) {
|
|
health_string2json(wb, "\t\t\t", "warn", rc->warning->source, ",\n");
|
|
health_string2json(wb, "\t\t\t", "warn_parsed", rc->warning->parsed_as, ",\n");
|
|
}
|
|
|
|
if(rc->critical) {
|
|
health_string2json(wb, "\t\t\t", "crit", rc->critical->source, ",\n");
|
|
health_string2json(wb, "\t\t\t", "crit_parsed", rc->critical->parsed_as, ",\n");
|
|
}
|
|
|
|
buffer_strcat(wb, "\t\t\t\"green\":");
|
|
buffer_rrd_value(wb, rc->green);
|
|
buffer_strcat(wb, ",\n");
|
|
|
|
buffer_strcat(wb, "\t\t\t\"red\":");
|
|
buffer_rrd_value(wb, rc->red);
|
|
buffer_strcat(wb, ",\n");
|
|
|
|
buffer_strcat(wb, "\t\t\t\"value\":");
|
|
buffer_rrd_value(wb, rc->value);
|
|
buffer_strcat(wb, "\n");
|
|
|
|
buffer_strcat(wb, "\t\t}");
|
|
}
|
|
|
|
//void health_rrdcalctemplate2json_nolock(BUFFER *wb, RRDCALCTEMPLATE *rt) {
|
|
//
|
|
//}
|
|
|
|
void health_aggregate_alarms(RRDHOST *host, BUFFER *wb, BUFFER* contexts, RRDCALC_STATUS status) {
|
|
RRDCALC *rc;
|
|
int numberOfAlarms = 0;
|
|
char *tok = NULL;
|
|
char *p = NULL;
|
|
|
|
if (contexts) {
|
|
p = (char*)buffer_tostring(contexts);
|
|
while(p && *p && (tok = mystrsep(&p, ", |"))) {
|
|
if(!*tok) continue;
|
|
|
|
STRING *tok_string = string_strdupz(tok);
|
|
|
|
foreach_rrdcalc_in_rrdhost_read(host, rc) {
|
|
if(unlikely(!rc->rrdset || !rc->rrdset->last_collected_time.tv_sec))
|
|
continue;
|
|
if (unlikely(!rrdset_is_available_for_exporting_and_alarms(rc->rrdset)))
|
|
continue;
|
|
if(unlikely(rc->rrdset
|
|
&& rc->rrdset->context == tok_string
|
|
&& ((status==RRDCALC_STATUS_RAISED)?(rc->status >= RRDCALC_STATUS_WARNING):rc->status == status)))
|
|
numberOfAlarms++;
|
|
}
|
|
foreach_rrdcalc_in_rrdhost_done(rc);
|
|
|
|
string_freez(tok_string);
|
|
}
|
|
}
|
|
else {
|
|
foreach_rrdcalc_in_rrdhost_read(host, rc) {
|
|
if(unlikely(!rc->rrdset || !rc->rrdset->last_collected_time.tv_sec))
|
|
continue;
|
|
if (unlikely(!rrdset_is_available_for_exporting_and_alarms(rc->rrdset)))
|
|
continue;
|
|
if(unlikely((status==RRDCALC_STATUS_RAISED)?(rc->status >= RRDCALC_STATUS_WARNING):rc->status == status))
|
|
numberOfAlarms++;
|
|
}
|
|
foreach_rrdcalc_in_rrdhost_done(rc);
|
|
}
|
|
|
|
buffer_sprintf(wb, "%d", numberOfAlarms);
|
|
}
|
|
|
|
static void health_alarms2json_fill_alarms(RRDHOST *host, BUFFER *wb, int all, void (*fp)(RRDHOST *, BUFFER *, RRDCALC *)) {
|
|
RRDCALC *rc;
|
|
int i = 0;
|
|
foreach_rrdcalc_in_rrdhost_read(host, rc) {
|
|
if(unlikely(!rc->rrdset || !rc->rrdset->last_collected_time.tv_sec))
|
|
continue;
|
|
|
|
if (unlikely(!rrdset_is_available_for_exporting_and_alarms(rc->rrdset)))
|
|
continue;
|
|
|
|
if(likely(!all && !(rc->status == RRDCALC_STATUS_WARNING || rc->status == RRDCALC_STATUS_CRITICAL)))
|
|
continue;
|
|
|
|
if(likely(i)) buffer_strcat(wb, ",\n");
|
|
fp(host, wb, rc);
|
|
i++;
|
|
}
|
|
foreach_rrdcalc_in_rrdhost_done(rc);
|
|
}
|
|
|
|
void health_alarms2json(RRDHOST *host, BUFFER *wb, int all) {
|
|
buffer_sprintf(wb, "{\n\t\"hostname\": \"%s\","
|
|
"\n\t\"latest_alarm_log_unique_id\": %u,"
|
|
"\n\t\"status\": %s,"
|
|
"\n\t\"now\": %lu,"
|
|
"\n\t\"alarms\": {\n",
|
|
rrdhost_hostname(host),
|
|
(host->health_log.next_log_id > 0)?(host->health_log.next_log_id - 1):0,
|
|
host->health_enabled?"true":"false",
|
|
(unsigned long)now_realtime_sec());
|
|
|
|
health_alarms2json_fill_alarms(host, wb, all, health_rrdcalc2json_nolock);
|
|
|
|
// rrdhost_rdlock(host);
|
|
// buffer_strcat(wb, "\n\t},\n\t\"templates\": {");
|
|
// RRDCALCTEMPLATE *rt;
|
|
// for(rt = host->templates; rt ; rt = rt->next)
|
|
// health_rrdcalctemplate2json_nolock(wb, rt);
|
|
// rrdhost_unlock(host);
|
|
|
|
buffer_strcat(wb, "\n\t}\n}\n");
|
|
}
|
|
|
|
void health_alarms_values2json(RRDHOST *host, BUFFER *wb, int all) {
|
|
buffer_sprintf(wb, "{\n\t\"hostname\": \"%s\","
|
|
"\n\t\"alarms\": {\n",
|
|
rrdhost_hostname(host));
|
|
|
|
health_alarms2json_fill_alarms(host, wb, all, health_rrdcalc_values2json_nolock);
|
|
|
|
buffer_strcat(wb, "\n\t}\n}\n");
|
|
}
|
|
|
|
static int have_recent_alarm(RRDHOST *host, uint32_t alarm_id, time_t mark)
|
|
{
|
|
ALARM_ENTRY *ae = host->health_log.alarms;
|
|
|
|
while(ae) {
|
|
if (ae->alarm_id == alarm_id && ae->unique_id > mark &&
|
|
(ae->new_status != RRDCALC_STATUS_WARNING && ae->new_status != RRDCALC_STATUS_CRITICAL))
|
|
return 1;
|
|
ae = ae->next;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
void health_active_log_alarms_2json(RRDHOST *host, BUFFER *wb) {
|
|
netdata_rwlock_rdlock(&host->health_log.alarm_log_rwlock);
|
|
|
|
buffer_sprintf(wb, "[\n");
|
|
|
|
unsigned int max = host->health_log.max;
|
|
unsigned int count = 0;
|
|
ALARM_ENTRY *ae;
|
|
for(ae = host->health_log.alarms; ae && count < max ; ae = ae->next) {
|
|
if (!ae->updated_by_id &&
|
|
((ae->new_status == RRDCALC_STATUS_WARNING || ae->new_status == RRDCALC_STATUS_CRITICAL) ||
|
|
((ae->old_status == RRDCALC_STATUS_WARNING || ae->old_status == RRDCALC_STATUS_CRITICAL) &&
|
|
ae->new_status == RRDCALC_STATUS_REMOVED))) {
|
|
|
|
if (have_recent_alarm(host, ae->alarm_id, ae->unique_id))
|
|
continue;
|
|
|
|
if (likely(count))
|
|
buffer_strcat(wb, ",");
|
|
health_alarm_entry2json_nolock(wb, ae, host);
|
|
count++;
|
|
}
|
|
}
|
|
buffer_strcat(wb, "]");
|
|
|
|
netdata_rwlock_unlock(&host->health_log.alarm_log_rwlock);
|
|
}
|