mirror of
https://github.com/netdata/netdata.git
synced 2025-04-06 14:35:32 +00:00

* rrdset - in progress * rrdset optimal constructor; rrdset conflict * rrdset final touches * re-organization of rrdset object members * prevent use-after-free * dictionary dfe supports also counting of iterations * rrddim managed by dictionary * rrd.h cleanup * DICTIONARY_ITEM now is referencing actual dictionary items in the code * removed rrdset linked list * Revert "removed rrdset linked list" This reverts commit 690d6a588b4b99619c2c5e10f84e8f868ae6def5. * removed rrdset linked list * added comments * Switch chart uuid to static allocation in rrdset Remove unused functions * rrdset_archive() and friends... * always create rrdfamily * enable ml_free_dimension * rrddim_foreach done with dfe * most custom rrddim loops replaced with rrddim_foreach * removed accesses to rrddim->dimensions * removed locks that are no longer needed * rrdsetvar is now managed by the dictionary * set rrdset is rrdsetvar, fixes https://github.com/netdata/netdata/pull/13646#issuecomment-1242574853 * conflict callback of rrdsetvar now properly checks if it has to reset the variable * dictionary registered callbacks accept as first parameter the DICTIONARY_ITEM * dictionary dfe now uses internal counter to report; avoided excess variables defined with dfe * dictionary walkthrough callbacks get dictionary acquired items * dictionary reference counters that can be dupped from zero * added advanced functions for get and del * rrdvar managed by dictionaries * thread safety for rrdsetvar * faster rrdvar initialization * rrdvar string lengths should match in all add, del, get functions * rrdvar internals hidden from the rest of the world * rrdvar is now acquired throughout netdata * hide the internal structures of rrdsetvar * rrdsetvar is now acquired through out netdata * rrddimvar managed by dictionary; rrddimvar linked list removed; rrddimvar structures hidden from the rest of netdata * better error handling * dont create variables if not initialized for health * dont create variables if not 
initialized for health again * rrdfamily is now managed by dictionaries; references of it are acquired dictionary items * type checking on acquired objects * rrdcalc renaming of functions * type checking for rrdfamily_acquired * rrdcalc managed by dictionaries * rrdcalc double free fix * host rrdvars is always needed * attempt to fix deadlock 1 * attempt to fix deadlock 2 * Remove unused variable * attempt to fix deadlock 3 * snprintfz * rrdcalc index in rrdset fix * Stop storing active charts and computing chart hashes * Remove store active chart function * Remove compute chart hash function * Remove sql_store_chart_hash function * Remove store_active_dimension function * dictionary delayed destruction * formatting and cleanup * zero dictionary base on rrdsetvar * added internal error to log delayed destructions of dictionaries * typo in rrddimvar * added debugging info to dictionary * debug info * fix for rrdcalc keys being empty * remove forgotten unlock * remove deadlock * Switch to metadata version 5 and drop chart_hash chart_hash_map chart_active dimension_active v_chart_hash * SQL cosmetic changes * do not busy wait while destroying a referenced dictionary * remove deadlock * code cleanup; re-organization; * fast cleanup and flushing of dictionaries * number formatting fixes * do not delete configured alerts when archiving a chart * rrddim obsolete linked list management outside dictionaries * removed duplicate contexts call * fix crash when rrdfamily is not initialized * dont keep rrddimvar referenced * properly cleanup rrdvar * removed some locks * Do not attempt to cleanup chart_hash / chart_hash_map * rrdcalctemplate managed by dictionary * register callbacks on the right dictionary * removed some more locks * rrdcalc secondary index replaced with linked-list; rrdcalc labels updates are now executed by health thread * when looking up for an alarm look using both chart id and chart name * host initialization a bit more modular * init rrdlabels on host 
update * preparation for dictionary views * improved comment * unused variables without internal checks * service threads isolation and worker info * more worker info in service thread * thread cancelability debugging with internal checks * strings data races addressed; fixes https://github.com/netdata/netdata/issues/13647 * dictionary modularization * Remove unused SQL statement definition * unit-tested thread safety of dictionaries; removed data race conditions on dictionaries and strings; dictionaries now can detect if the caller is holds a write lock and automatically all the calls become their unsafe versions; all direct calls to unsafe version is eliminated * remove worker_is_idle() from the exit of service functions, because we lose the lock time between loops * rewritten dictionary to have 2 separate locks, one for indexing and another for traversal * Update collectors/cgroups.plugin/sys_fs_cgroup.c Co-authored-by: Vladimir Kobal <vlad@prokk.net> * Update collectors/cgroups.plugin/sys_fs_cgroup.c Co-authored-by: Vladimir Kobal <vlad@prokk.net> * Update collectors/proc.plugin/proc_net_dev.c Co-authored-by: Vladimir Kobal <vlad@prokk.net> * fix memory leak in rrdset cache_dir * minor dictionary changes * dont use index locks in single threaded * obsolete dict option * rrddim options and flags separation; rrdset_done() optimization to keep array of reference pointers to rrddim; * fix jump on uninitialized value in dictionary; remove double free of cache_dir * addressed codacy findings * removed debugging code * use the private refcount on dictionaries * make dictionary item desctructors work on dictionary destruction; strictier control on dictionary API; proper cleanup sequence on rrddim; * more dictionary statistics * global statistics about dictionary operations, memory, items, callbacks * dictionary support for views - missing the public API * removed warning about unused parameter * chart and context name for cloud * chart and context name for cloud, again 
* dictionary statistics fixed; first implementation of dictionary views - not currently used * only the master can globally delete an item * context needs netdata prefix * fix context and chart it of spins * fix for host variables when health is not enabled * run garbage collector on item insert too * Fix info message; remove extra "using" * update dict unittest for new placement of garbage collector * we need RRDHOST->rrdvars for maintaining custom host variables * Health initialization needs the host->host_uuid * split STRING to its own files; no code changes other than that * initialize health unconditionally * unit tests do not pollute the global scope with their variables * Skip initialization when creating archived hosts on startup. When a child connects it will initialize properly Co-authored-by: Stelios Fragkakis <52996999+stelfrag@users.noreply.github.com> Co-authored-by: Vladimir Kobal <vlad@prokk.net>
157 lines
3.7 KiB
C++
157 lines
3.7 KiB
C++
// SPDX-License-Identifier: GPL-3.0-or-later
|
|
|
|
#ifndef ML_DIMENSION_H
|
|
#define ML_DIMENSION_H
|
|
|
|
#include "BitBufferCounter.h"
|
|
#include "Config.h"
|
|
|
|
#include "ml-private.h"
|
|
|
|
namespace ml {
|
|
|
|
class RrdDimension {
|
|
public:
|
|
RrdDimension(RRDDIM *RD) : RD(RD), Ops(&RD->tiers[0]->query_ops) { }
|
|
|
|
RRDDIM *getRD() const { return RD; }
|
|
|
|
time_t latestTime() { return Ops->latest_time(RD->tiers[0]->db_metric_handle); }
|
|
|
|
time_t oldestTime() { return Ops->oldest_time(RD->tiers[0]->db_metric_handle); }
|
|
|
|
unsigned updateEvery() const { return RD->update_every; }
|
|
|
|
const std::string getID() const {
|
|
RRDSET *RS = RD->rrdset;
|
|
|
|
std::stringstream SS;
|
|
SS << rrdset_context(RS) << "|" << rrdset_id(RS) << "|" << rrddim_name(RD);
|
|
return SS.str();
|
|
}
|
|
|
|
bool isActive() const {
|
|
if (rrdset_flag_check(RD->rrdset, RRDSET_FLAG_OBSOLETE))
|
|
return false;
|
|
|
|
if (rrddim_flag_check(RD, RRDDIM_FLAG_OBSOLETE))
|
|
return false;
|
|
|
|
return true;
|
|
}
|
|
|
|
void setAnomalyRateRD(RRDDIM *ARRD) { AnomalyRateRD = ARRD; }
|
|
RRDDIM *getAnomalyRateRD() const { return AnomalyRateRD; }
|
|
|
|
void setAnomalyRateRDName(const char *Name) const {
|
|
rrddim_reset_name(AnomalyRateRD->rrdset, AnomalyRateRD, Name);
|
|
}
|
|
|
|
virtual ~RrdDimension() {}
|
|
|
|
private:
|
|
RRDDIM *RD;
|
|
RRDDIM *AnomalyRateRD;
|
|
|
|
struct rrddim_query_ops *Ops;
|
|
|
|
std::string ID;
|
|
};
|
|
|
|
/**
 * Outcome code shared by the training and prediction entry points declared
 * in this header (`trainModel()` and `predict()`).
 *
 * NOTE(review): the per-enumerator meanings below are inferred from the
 * names; confirm against the implementation file.
 */
enum class MLResult {
    Success = 0,  // operation completed
    MissingData,  // presumably: not enough samples were available
    NaN,          // presumably: a non-finite value was encountered
};
|
|
|
|
class TrainableDimension : public RrdDimension {
|
|
public:
|
|
TrainableDimension(RRDDIM *RD) :
|
|
RrdDimension(RD), TrainEvery(Cfg.TrainEvery * updateEvery()) {}
|
|
|
|
MLResult trainModel();
|
|
|
|
CalculatedNumber computeAnomalyScore(SamplesBuffer &SB) {
|
|
return Trained ? KM.anomalyScore(SB) : 0.0;
|
|
}
|
|
|
|
bool shouldTrain(const TimePoint &TP) const {
|
|
if (ConstantModel)
|
|
return false;
|
|
|
|
return (LastTrainedAt + TrainEvery) < TP;
|
|
}
|
|
|
|
bool isTrained() const { return Trained; }
|
|
|
|
private:
|
|
std::pair<CalculatedNumber *, size_t> getCalculatedNumbers();
|
|
|
|
public:
|
|
TimePoint LastTrainedAt{Seconds{0}};
|
|
|
|
protected:
|
|
std::atomic<bool> ConstantModel{false};
|
|
|
|
private:
|
|
Seconds TrainEvery;
|
|
KMeans KM;
|
|
|
|
std::atomic<bool> Trained{false};
|
|
};
|
|
|
|
class PredictableDimension : public TrainableDimension {
|
|
public:
|
|
PredictableDimension(RRDDIM *RD) : TrainableDimension(RD) {}
|
|
|
|
std::pair<MLResult, bool> predict();
|
|
|
|
void addValue(CalculatedNumber Value, bool Exists);
|
|
|
|
bool isAnomalous() { return AnomalyBit; }
|
|
|
|
void updateAnomalyBitCounter(RRDSET *RS, unsigned Elapsed, bool IsAnomalous) {
|
|
AnomalyBitCounter += IsAnomalous;
|
|
|
|
if (Elapsed == Cfg.DBEngineAnomalyRateEvery) {
|
|
double AR = static_cast<double>(AnomalyBitCounter) / Cfg.DBEngineAnomalyRateEvery;
|
|
rrddim_set_by_pointer(RS, getAnomalyRateRD(), AR * 1000);
|
|
AnomalyBitCounter = 0;
|
|
}
|
|
}
|
|
|
|
private:
|
|
CalculatedNumber AnomalyScore{0.0};
|
|
std::atomic<bool> AnomalyBit{false};
|
|
unsigned AnomalyBitCounter{0};
|
|
|
|
std::vector<CalculatedNumber> CNs;
|
|
};
|
|
|
|
class DetectableDimension : public PredictableDimension {
|
|
public:
|
|
DetectableDimension(RRDDIM *RD) : PredictableDimension(RD) {}
|
|
|
|
std::pair<bool, double> detect(size_t WindowLength, bool Reset) {
|
|
bool AnomalyBit = isAnomalous();
|
|
|
|
if (Reset)
|
|
NumSetBits = BBC.numSetBits();
|
|
|
|
NumSetBits += AnomalyBit;
|
|
BBC.insert(AnomalyBit);
|
|
|
|
double AnomalyRate = static_cast<double>(NumSetBits) / WindowLength;
|
|
return { AnomalyBit, AnomalyRate };
|
|
}
|
|
|
|
private:
|
|
BitBufferCounter BBC{static_cast<size_t>(Cfg.ADMinWindowSize)};
|
|
size_t NumSetBits{0};
|
|
};
|
|
|
|
// `Dimension` names the most-derived class of the hierarchy declared above.
using Dimension = DetectableDimension;
|
|
|
|
} // namespace ml
|
|
|
|
#endif /* ML_DIMENSION_H */
|