mirror of
https://github.com/netdata/netdata.git
synced 2025-04-06 14:35:32 +00:00

* rrdset - in progress * rrdset optimal constructor; rrdset conflict * rrdset final touches * re-organization of rrdset object members * prevent use-after-free * dictionary dfe supports also counting of iterations * rrddim managed by dictionary * rrd.h cleanup * DICTIONARY_ITEM now is referencing actual dictionary items in the code * removed rrdset linked list * Revert "removed rrdset linked list" This reverts commit 690d6a588b4b99619c2c5e10f84e8f868ae6def5. * removed rrdset linked list * added comments * Switch chart uuid to static allocation in rrdset Remove unused functions * rrdset_archive() and friends... * always create rrdfamily * enable ml_free_dimension * rrddim_foreach done with dfe * most custom rrddim loops replaced with rrddim_foreach * removed accesses to rrddim->dimensions * removed locks that are no longer needed * rrdsetvar is now managed by the dictionary * set rrdset is rrdsetvar, fixes https://github.com/netdata/netdata/pull/13646#issuecomment-1242574853 * conflict callback of rrdsetvar now properly checks if it has to reset the variable * dictionary registered callbacks accept as first parameter the DICTIONARY_ITEM * dictionary dfe now uses internal counter to report; avoided excess variables defined with dfe * dictionary walkthrough callbacks get dictionary acquired items * dictionary reference counters that can be dupped from zero * added advanced functions for get and del * rrdvar managed by dictionaries * thread safety for rrdsetvar * faster rrdvar initialization * rrdvar string lengths should match in all add, del, get functions * rrdvar internals hidden from the rest of the world * rrdvar is now acquired throughout netdata * hide the internal structures of rrdsetvar * rrdsetvar is now acquired through out netdata * rrddimvar managed by dictionary; rrddimvar linked list removed; rrddimvar structures hidden from the rest of netdata * better error handling * dont create variables if not initialized for health * dont create variables if not 
initialized for health again * rrdfamily is now managed by dictionaries; references of it are acquired dictionary items * type checking on acquired objects * rrdcalc renaming of functions * type checking for rrdfamily_acquired * rrdcalc managed by dictionaries * rrdcalc double free fix * host rrdvars is always needed * attempt to fix deadlock 1 * attempt to fix deadlock 2 * Remove unused variable * attempt to fix deadlock 3 * snprintfz * rrdcalc index in rrdset fix * Stop storing active charts and computing chart hashes * Remove store active chart function * Remove compute chart hash function * Remove sql_store_chart_hash function * Remove store_active_dimension function * dictionary delayed destruction * formatting and cleanup * zero dictionary base on rrdsetvar * added internal error to log delayed destructions of dictionaries * typo in rrddimvar * added debugging info to dictionary * debug info * fix for rrdcalc keys being empty * remove forgotten unlock * remove deadlock * Switch to metadata version 5 and drop chart_hash chart_hash_map chart_active dimension_active v_chart_hash * SQL cosmetic changes * do not busy wait while destroying a referenced dictionary * remove deadlock * code cleanup; re-organization; * fast cleanup and flushing of dictionaries * number formatting fixes * do not delete configured alerts when archiving a chart * rrddim obsolete linked list management outside dictionaries * removed duplicate contexts call * fix crash when rrdfamily is not initialized * dont keep rrddimvar referenced * properly cleanup rrdvar * removed some locks * Do not attempt to cleanup chart_hash / chart_hash_map * rrdcalctemplate managed by dictionary * register callbacks on the right dictionary * removed some more locks * rrdcalc secondary index replaced with linked-list; rrdcalc labels updates are now executed by health thread * when looking up for an alarm look using both chart id and chart name * host initialization a bit more modular * init rrdlabels on host 
update * preparation for dictionary views * improved comment * unused variables without internal checks * service threads isolation and worker info * more worker info in service thread * thread cancelability debugging with internal checks * strings data races addressed; fixes https://github.com/netdata/netdata/issues/13647 * dictionary modularization * Remove unused SQL statement definition * unit-tested thread safety of dictionaries; removed data race conditions on dictionaries and strings; dictionaries now can detect if the caller is holds a write lock and automatically all the calls become their unsafe versions; all direct calls to unsafe version is eliminated * remove worker_is_idle() from the exit of service functions, because we lose the lock time between loops * rewritten dictionary to have 2 separate locks, one for indexing and another for traversal * Update collectors/cgroups.plugin/sys_fs_cgroup.c Co-authored-by: Vladimir Kobal <vlad@prokk.net> * Update collectors/cgroups.plugin/sys_fs_cgroup.c Co-authored-by: Vladimir Kobal <vlad@prokk.net> * Update collectors/proc.plugin/proc_net_dev.c Co-authored-by: Vladimir Kobal <vlad@prokk.net> * fix memory leak in rrdset cache_dir * minor dictionary changes * dont use index locks in single threaded * obsolete dict option * rrddim options and flags separation; rrdset_done() optimization to keep array of reference pointers to rrddim; * fix jump on uninitialized value in dictionary; remove double free of cache_dir * addressed codacy findings * removed debugging code * use the private refcount on dictionaries * make dictionary item desctructors work on dictionary destruction; strictier control on dictionary API; proper cleanup sequence on rrddim; * more dictionary statistics * global statistics about dictionary operations, memory, items, callbacks * dictionary support for views - missing the public API * removed warning about unused parameter * chart and context name for cloud * chart and context name for cloud, again 
* dictionary statistics fixed; first implementation of dictionary views - not currently used * only the master can globally delete an item * context needs netdata prefix * fix context and chart it of spins * fix for host variables when health is not enabled * run garbage collector on item insert too * Fix info message; remove extra "using" * update dict unittest for new placement of garbage collector * we need RRDHOST->rrdvars for maintaining custom host variables * Health initialization needs the host->host_uuid * split STRING to its own files; no code changes other than that * initialize health unconditionally * unit tests do not pollute the global scope with their variables * Skip initialization when creating archived hosts on startup. When a child connects it will initialize properly Co-authored-by: Stelios Fragkakis <52996999+stelfrag@users.noreply.github.com> Co-authored-by: Vladimir Kobal <vlad@prokk.net>
246 lines
7.9 KiB
C
246 lines
7.9 KiB
C
// SPDX-License-Identifier: GPL-3.0-or-later
|
|
|
|
#include "plugin_proc.h"
|
|
|
|
// module name passed to rrdset_create_localhost() for every chart created by this file
#define PLUGIN_PROC_MODULE_SOFTIRQS_NAME "/proc/softirqs"

// maximum number of characters kept from a softirq name
// (buffers are declared with one extra byte for the terminator)
#define MAX_INTERRUPT_NAME 50
|
|
|
|
struct cpu_interrupt {
|
|
unsigned long long value;
|
|
RRDDIM *rd;
|
|
};
|
|
|
|
struct interrupt {
|
|
int used;
|
|
char *id;
|
|
char name[MAX_INTERRUPT_NAME + 1];
|
|
RRDDIM *rd;
|
|
unsigned long long total;
|
|
struct cpu_interrupt cpu[];
|
|
};
|
|
|
|
// every interrupt record carries a trailing array of per CPU entries,
// so its size in bytes depends on the number of CPUs
#define recordsize(cpus) (sizeof(struct interrupt) + ((cpus) * sizeof(struct cpu_interrupt)))
|
|
|
|
// locate the record of a line: records are variable in size, so the array
// cannot be indexed directly - we step (line * recordsize) bytes from the base
#define irrindex(base, line, cpus) ((struct interrupt *)((char *)(base) + ((line) * recordsize(cpus))))
|
|
|
|
static inline struct interrupt *get_interrupts_array(size_t lines, int cpus) {
|
|
static struct interrupt *irrs = NULL;
|
|
static size_t allocated = 0;
|
|
|
|
if(unlikely(lines != allocated)) {
|
|
uint32_t l;
|
|
int c;
|
|
|
|
irrs = (struct interrupt *)reallocz(irrs, lines * recordsize(cpus));
|
|
|
|
// reset all interrupt RRDDIM pointers as any line could have shifted
|
|
for(l = 0; l < lines ;l++) {
|
|
struct interrupt *irr = irrindex(irrs, l, cpus);
|
|
irr->rd = NULL;
|
|
irr->name[0] = '\0';
|
|
for(c = 0; c < cpus ;c++)
|
|
irr->cpu[c].rd = NULL;
|
|
}
|
|
|
|
allocated = lines;
|
|
}
|
|
|
|
return irrs;
|
|
}
|
|
|
|
int do_proc_softirqs(int update_every, usec_t dt) {
|
|
(void)dt;
|
|
static procfile *ff = NULL;
|
|
static int cpus = -1, do_per_core = CONFIG_BOOLEAN_INVALID;
|
|
struct interrupt *irrs = NULL;
|
|
|
|
if(unlikely(do_per_core == CONFIG_BOOLEAN_INVALID))
|
|
do_per_core = config_get_boolean_ondemand("plugin:proc:/proc/softirqs", "interrupts per core", CONFIG_BOOLEAN_AUTO);
|
|
|
|
if(unlikely(!ff)) {
|
|
char filename[FILENAME_MAX + 1];
|
|
snprintfz(filename, FILENAME_MAX, "%s%s", netdata_configured_host_prefix, "/proc/softirqs");
|
|
ff = procfile_open(config_get("plugin:proc:/proc/softirqs", "filename to monitor", filename), " \t:", PROCFILE_FLAG_DEFAULT);
|
|
if(unlikely(!ff)) return 1;
|
|
}
|
|
|
|
ff = procfile_readall(ff);
|
|
if(unlikely(!ff)) return 0; // we return 0, so that we will retry to open it next time
|
|
|
|
size_t lines = procfile_lines(ff), l;
|
|
size_t words = procfile_linewords(ff, 0);
|
|
|
|
if(unlikely(!lines)) {
|
|
error("Cannot read /proc/softirqs, zero lines reported.");
|
|
return 1;
|
|
}
|
|
|
|
// find how many CPUs are there
|
|
if(unlikely(cpus == -1)) {
|
|
uint32_t w;
|
|
cpus = 0;
|
|
for(w = 0; w < words ; w++) {
|
|
if(likely(strncmp(procfile_lineword(ff, 0, w), "CPU", 3) == 0))
|
|
cpus++;
|
|
}
|
|
}
|
|
|
|
if(unlikely(!cpus)) {
|
|
error("PLUGIN: PROC_SOFTIRQS: Cannot find the number of CPUs in /proc/softirqs");
|
|
return 1;
|
|
}
|
|
|
|
// allocate the size we need;
|
|
irrs = get_interrupts_array(lines, cpus);
|
|
irrs[0].used = 0;
|
|
|
|
// loop through all lines
|
|
for(l = 1; l < lines ;l++) {
|
|
struct interrupt *irr = irrindex(irrs, l, cpus);
|
|
irr->used = 0;
|
|
irr->total = 0;
|
|
|
|
words = procfile_linewords(ff, l);
|
|
if(unlikely(!words)) continue;
|
|
|
|
irr->id = procfile_lineword(ff, l, 0);
|
|
if(unlikely(!irr->id || !irr->id[0])) continue;
|
|
|
|
int c;
|
|
for(c = 0; c < cpus ;c++) {
|
|
if(likely((c + 1) < (int)words))
|
|
irr->cpu[c].value = str2ull(procfile_lineword(ff, l, (uint32_t)(c + 1)));
|
|
else
|
|
irr->cpu[c].value = 0;
|
|
|
|
irr->total += irr->cpu[c].value;
|
|
}
|
|
|
|
strncpyz(irr->name, irr->id, MAX_INTERRUPT_NAME);
|
|
|
|
irr->used = 1;
|
|
}
|
|
|
|
// --------------------------------------------------------------------
|
|
|
|
static RRDSET *st_system_softirqs = NULL;
|
|
if(unlikely(!st_system_softirqs))
|
|
st_system_softirqs = rrdset_create_localhost(
|
|
"system"
|
|
, "softirqs"
|
|
, NULL
|
|
, "softirqs"
|
|
, NULL
|
|
, "System softirqs"
|
|
, "softirqs/s"
|
|
, PLUGIN_PROC_NAME
|
|
, PLUGIN_PROC_MODULE_SOFTIRQS_NAME
|
|
, NETDATA_CHART_PRIO_SYSTEM_SOFTIRQS
|
|
, update_every
|
|
, RRDSET_TYPE_STACKED
|
|
);
|
|
else
|
|
rrdset_next(st_system_softirqs);
|
|
|
|
for(l = 0; l < lines ;l++) {
|
|
struct interrupt *irr = irrindex(irrs, l, cpus);
|
|
|
|
if(irr->used && irr->total) {
|
|
// some interrupt may have changed without changing the total number of lines
|
|
// if the same number of interrupts have been added and removed between two
|
|
// calls of this function.
|
|
if(unlikely(!irr->rd || strncmp(irr->name, rrddim_name(irr->rd), MAX_INTERRUPT_NAME) != 0)) {
|
|
irr->rd = rrddim_add(st_system_softirqs, irr->id, irr->name, 1, 1, RRD_ALGORITHM_INCREMENTAL);
|
|
rrddim_reset_name(st_system_softirqs, irr->rd, irr->name);
|
|
|
|
// also reset per cpu RRDDIMs to avoid repeating strncmp() in the per core loop
|
|
if(likely(do_per_core != CONFIG_BOOLEAN_NO)) {
|
|
int c;
|
|
for(c = 0; c < cpus; c++) irr->cpu[c].rd = NULL;
|
|
}
|
|
}
|
|
|
|
rrddim_set_by_pointer(st_system_softirqs, irr->rd, irr->total);
|
|
}
|
|
}
|
|
|
|
rrdset_done(st_system_softirqs);
|
|
|
|
// --------------------------------------------------------------------
|
|
|
|
if(do_per_core != CONFIG_BOOLEAN_NO) {
|
|
static RRDSET **core_st = NULL;
|
|
static int old_cpus = 0;
|
|
|
|
if(old_cpus < cpus) {
|
|
core_st = reallocz(core_st, sizeof(RRDSET *) * cpus);
|
|
memset(&core_st[old_cpus], 0, sizeof(RRDSET *) * (cpus - old_cpus));
|
|
old_cpus = cpus;
|
|
}
|
|
|
|
int c;
|
|
|
|
for(c = 0; c < cpus ; c++) {
|
|
if(unlikely(!core_st[c])) {
|
|
// find if everything is just zero
|
|
unsigned long long core_sum = 0;
|
|
|
|
for (l = 0; l < lines; l++) {
|
|
struct interrupt *irr = irrindex(irrs, l, cpus);
|
|
if (unlikely(!irr->used)) continue;
|
|
core_sum += irr->cpu[c].value;
|
|
}
|
|
|
|
if (unlikely(core_sum == 0)) continue; // try next core
|
|
|
|
char id[50 + 1];
|
|
snprintfz(id, 50, "cpu%d_softirqs", c);
|
|
|
|
char title[100 + 1];
|
|
snprintfz(title, 100, "CPU softirqs");
|
|
|
|
core_st[c] = rrdset_create_localhost(
|
|
"cpu"
|
|
, id
|
|
, NULL
|
|
, "softirqs"
|
|
, "cpu.softirqs"
|
|
, title
|
|
, "softirqs/s"
|
|
, PLUGIN_PROC_NAME
|
|
, PLUGIN_PROC_MODULE_SOFTIRQS_NAME
|
|
, NETDATA_CHART_PRIO_SOFTIRQS_PER_CORE + c
|
|
, update_every
|
|
, RRDSET_TYPE_STACKED
|
|
);
|
|
|
|
char core[50+1];
|
|
snprintfz(core, 50, "cpu%d", c);
|
|
rrdlabels_add(core_st[c]->rrdlabels, "cpu", core, RRDLABEL_SRC_AUTO);
|
|
}
|
|
else
|
|
rrdset_next(core_st[c]);
|
|
|
|
for(l = 0; l < lines ;l++) {
|
|
struct interrupt *irr = irrindex(irrs, l, cpus);
|
|
|
|
if(irr->used && (do_per_core == CONFIG_BOOLEAN_YES || irr->cpu[c].value)) {
|
|
if(unlikely(!irr->cpu[c].rd)) {
|
|
irr->cpu[c].rd = rrddim_add(core_st[c], irr->id, irr->name, 1, 1, RRD_ALGORITHM_INCREMENTAL);
|
|
rrddim_reset_name(core_st[c], irr->cpu[c].rd, irr->name);
|
|
}
|
|
|
|
rrddim_set_by_pointer(core_st[c], irr->cpu[c].rd, irr->cpu[c].value);
|
|
}
|
|
}
|
|
|
|
rrdset_done(core_st[c]);
|
|
}
|
|
}
|
|
|
|
return 0;
|
|
}
|