mirror of
https://github.com/netdata/netdata.git
synced 2025-04-16 02:24:15 +00:00

* rrdfamily * rrddim * rrdset plugin and module names * rrdset units * rrdset type * rrdset family * rrdset title * rrdset title more * rrdset context * rrdcalctemplate context and removal of context hash from rrdset * strings statistics * rrdset name * rearranged members of rrdset * eliminate rrdset name hash; rrdcalc chart converted to STRING * rrdset id, eliminated rrdset hash * rrdcalc, alarm_entry, alert_config and some of rrdcalctemplate * rrdcalctemplate * rrdvar * eval_variable * rrddimvar and rrdsetvar * rrdhost hostname, os and tags * fix master commits * added thread cache; implemented string_dup without locks * faster thread cache * rrdset and rrddim now use dictionaries for indexing * rrdhost now uses dictionary * rrdfamily now uses DICTIONARY * rrdvar using dictionary instead of AVL * allocate the right size to rrdvar flag members * rrdhost remaining char * members to STRING * * better error handling on indexing * strings now use a read/write lock to allow parallel searches to the index * removed AVL support from dictionaries; implemented STRING with native Judy calls * string releases should be negative * only 31 bits are allowed for enum flags * proper locking on strings * string threading unittest and fixes * fix lgtm finding * fixed naming * stream chart/dimension definitions at the beginning of a streaming session * thread stack variable is undefined on thread cancel * rrdcontext garbage collect per host on startup * worker control in garbage collection * relaxed deletion of rrdmetrics * type checking on dictfe * netdata chart to monitor rrdcontext triggers * Group chart label updates * rrdcontext better handling of collected rrdsets * rrdpush incremental transmition of definitions should use as much buffer as possible * require 1MB per chart * empty the sender buffer before enabling metrics streaming * fill up to 50% of buffer * reset signaling metrics sending * use the shared variable for status * use separate host flag for enabling streaming of metrics * make sure the flag is clear * add logging for streaming * add logging for streaming on buffer overflow * circular_buffer proper sizing * removed obsolete logs * do not execute worker jobs if not necessary * better messages about compression disabling * proper use of flags and updating rrdset last access time every time the obsoletion flag is flipped * monitor stream sender used buffer ratio * Update exporting unit tests * no need to compare label value with strcmp * streaming send workers now monitor bandwidth * workers now use strings * streaming receiver monitors incoming bandwidth * parser shift of worker ids * minor fixes * Group chart label updates * Populate context with dimensions that have data * Fix chart id * better shift of parser worker ids * fix for streaming compression * properly count received bytes * ensure LZ4 compression ring buffer does not wrap prematurely * do not stream empty charts; do not process empty instances in rrdcontext * need_to_send_chart_definition() does not need an rrdset lock any more * rrdcontext objects are collected, after data have been written to the db * better logging of RRDCONTEXT transitions * always set all variables needed by the worker utilization charts * implemented double linked list for most objects; eliminated alarm indexes from rrdhost; and many more fixes * lockless strings design - string_dup() and string_freez() are totally lockless when they dont need to touch Judy - only Judy is protected with a read/write lock * STRING code re-organization for clarity * thread_cache improvements; double numbers precision on worker threads * STRING_ENTRY now shadown STRING, so no duplicate definition is required; string_length() renamed to string_strlen() to follow the paradigm of all other functions, STRING internal statistics are now only compiled with NETDATA_INTERNAL_CHECKS * rrdhost index by hostname now cleans up; aclk queries of archieved hosts do not index hosts * Add index to speed up database context searches * Removed last_updated optimization (was also buggy after latest merge with master) Co-authored-by: Stelios Fragkakis <52996999+stelfrag@users.noreply.github.com> Co-authored-by: Vladimir Kobal <vlad@prokk.net>
247 lines
7.9 KiB
C
247 lines
7.9 KiB
C
// SPDX-License-Identifier: GPL-3.0-or-later
|
|
|
|
#ifndef NETDATA_SQLITE_ACLK_H
|
|
#define NETDATA_SQLITE_ACLK_H
|
|
|
|
#include "sqlite3.h"
|
|
|
|
// TODO: To be added
|
|
#include "../../aclk/schema-wrappers/chart_stream.h"
|
|
|
|
#ifndef ACLK_MAX_CHART_BATCH
|
|
#define ACLK_MAX_CHART_BATCH (200)
|
|
#endif
|
|
#ifndef ACLK_MAX_CHART_BATCH_COUNT
|
|
#define ACLK_MAX_CHART_BATCH_COUNT (10)
|
|
#endif
|
|
#define ACLK_MAX_ALERT_UPDATES (5)
|
|
#define ACLK_DATABASE_CLEANUP_FIRST (60)
|
|
#define ACLK_DATABASE_ROTATION_DELAY (180)
|
|
#define ACLK_DATABASE_RETENTION_RETRY (60)
|
|
#define ACLK_DATABASE_CLEANUP_INTERVAL (3600)
|
|
#define ACLK_DATABASE_ROTATION_INTERVAL (3600)
|
|
#define ACLK_DELETE_ACK_INTERNAL (600)
|
|
#define ACLK_DELETE_ACK_ALERTS_INTERNAL (86400)
|
|
#define ACLK_AUTO_MARK_SUBMIT_INTERVAL (3600)
|
|
#define ACLK_AUTO_MARK_UPDATED_INTERVAL (1800)
|
|
#define ACLK_SYNC_QUERY_SIZE 512
|
|
|
|
struct aclk_completion {
|
|
uv_mutex_t mutex;
|
|
uv_cond_t cond;
|
|
volatile unsigned completed;
|
|
};
|
|
|
|
static inline void init_aclk_completion(struct aclk_completion *p)
|
|
{
|
|
p->completed = 0;
|
|
fatal_assert(0 == uv_cond_init(&p->cond));
|
|
fatal_assert(0 == uv_mutex_init(&p->mutex));
|
|
}
|
|
|
|
static inline void destroy_aclk_completion(struct aclk_completion *p)
|
|
{
|
|
uv_cond_destroy(&p->cond);
|
|
uv_mutex_destroy(&p->mutex);
|
|
}
|
|
|
|
static inline void wait_for_aclk_completion(struct aclk_completion *p)
|
|
{
|
|
uv_mutex_lock(&p->mutex);
|
|
while (0 == p->completed) {
|
|
uv_cond_wait(&p->cond, &p->mutex);
|
|
}
|
|
fatal_assert(1 == p->completed);
|
|
uv_mutex_unlock(&p->mutex);
|
|
}
|
|
|
|
static inline void aclk_complete(struct aclk_completion *p)
|
|
{
|
|
uv_mutex_lock(&p->mutex);
|
|
p->completed = 1;
|
|
uv_mutex_unlock(&p->mutex);
|
|
uv_cond_broadcast(&p->cond);
|
|
}
|
|
|
|
extern uv_mutex_t aclk_async_lock;
|
|
|
|
static inline void uuid_unparse_lower_fix(uuid_t *uuid, char *out)
|
|
{
|
|
uuid_unparse_lower(*uuid, out);
|
|
out[8] = '_';
|
|
out[13] = '_';
|
|
out[18] = '_';
|
|
out[23] = '_';
|
|
}
|
|
|
|
static inline char *get_str_from_uuid(uuid_t *uuid)
|
|
{
|
|
char uuid_str[GUID_LEN + 1];
|
|
if (unlikely(!uuid)) {
|
|
uuid_t zero_uuid;
|
|
uuid_clear(zero_uuid);
|
|
uuid_unparse_lower(zero_uuid, uuid_str);
|
|
}
|
|
else
|
|
uuid_unparse_lower(*uuid, uuid_str);
|
|
return strdupz(uuid_str);
|
|
}
|
|
|
|
#define TABLE_ACLK_CHART "CREATE TABLE IF NOT EXISTS aclk_chart_%s (sequence_id INTEGER PRIMARY KEY, " \
|
|
"date_created, date_updated, date_submitted, status, uuid, type, unique_id, " \
|
|
"update_count default 1, unique(uuid, status));"
|
|
|
|
#define TABLE_ACLK_CHART_PAYLOAD "CREATE TABLE IF NOT EXISTS aclk_chart_payload_%s (unique_id BLOB PRIMARY KEY, " \
|
|
"uuid, claim_id, type, date_created, payload);"
|
|
|
|
#define TABLE_ACLK_CHART_LATEST "CREATE TABLE IF NOT EXISTS aclk_chart_latest_%s (uuid BLOB PRIMARY KEY, " \
|
|
"unique_id, date_submitted);"
|
|
|
|
#define TRIGGER_ACLK_CHART_PAYLOAD "CREATE TRIGGER IF NOT EXISTS aclk_tr_chart_payload_%s " \
|
|
"after insert on aclk_chart_payload_%s " \
|
|
"begin insert into aclk_chart_%s (uuid, unique_id, type, status, date_created) values " \
|
|
" (new.uuid, new.unique_id, new.type, 'pending', unixepoch()) on conflict(uuid, status) " \
|
|
" do update set unique_id = new.unique_id, update_count = update_count + 1; " \
|
|
"end;"
|
|
|
|
#define TABLE_ACLK_ALERT "CREATE TABLE IF NOT EXISTS aclk_alert_%s (sequence_id INTEGER PRIMARY KEY, " \
|
|
"alert_unique_id, date_created, date_submitted, date_cloud_ack, " \
|
|
"unique(alert_unique_id));"
|
|
|
|
#define INDEX_ACLK_CHART "CREATE INDEX IF NOT EXISTS aclk_chart_index_%s ON aclk_chart_%s (unique_id);"
|
|
|
|
#define INDEX_ACLK_CHART_LATEST "CREATE INDEX IF NOT EXISTS aclk_chart_latest_index_%s ON aclk_chart_latest_%s (unique_id);"
|
|
|
|
#define INDEX_ACLK_ALERT "CREATE INDEX IF NOT EXISTS aclk_alert_index_%s ON aclk_alert_%s (alert_unique_id);"
|
|
|
|
enum aclk_database_opcode {
|
|
ACLK_DATABASE_NOOP = 0,
|
|
|
|
ACLK_DATABASE_ADD_CHART,
|
|
ACLK_DATABASE_ADD_DIMENSION,
|
|
ACLK_DATABASE_PUSH_CHART,
|
|
ACLK_DATABASE_PUSH_CHART_CONFIG,
|
|
ACLK_DATABASE_RESET_CHART,
|
|
ACLK_DATABASE_CHART_ACK,
|
|
ACLK_DATABASE_UPD_RETENTION,
|
|
ACLK_DATABASE_DIM_DELETION,
|
|
ACLK_DATABASE_ORPHAN_HOST,
|
|
ACLK_DATABASE_ALARM_HEALTH_LOG,
|
|
ACLK_DATABASE_CLEANUP,
|
|
ACLK_DATABASE_DELETE_HOST,
|
|
ACLK_DATABASE_NODE_INFO,
|
|
ACLK_DATABASE_PUSH_ALERT,
|
|
ACLK_DATABASE_PUSH_ALERT_CONFIG,
|
|
ACLK_DATABASE_PUSH_ALERT_SNAPSHOT,
|
|
ACLK_DATABASE_QUEUE_REMOVED_ALERTS,
|
|
ACLK_DATABASE_NODE_COLLECTORS,
|
|
ACLK_DATABASE_TIMER,
|
|
|
|
// leave this last
|
|
// we need it to check for worker utilization
|
|
ACLK_MAX_ENUMERATIONS_DEFINED
|
|
};
|
|
|
|
struct aclk_chart_payload_t {
|
|
long sequence_id;
|
|
long last_sequence_id;
|
|
char *payload;
|
|
struct aclk_chart_payload_t *next;
|
|
};
|
|
|
|
|
|
struct aclk_database_cmd {
|
|
enum aclk_database_opcode opcode;
|
|
void *data;
|
|
void *data_param;
|
|
int count;
|
|
uint64_t param1;
|
|
struct aclk_completion *completion;
|
|
};
|
|
|
|
#define ACLK_DATABASE_CMD_Q_MAX_SIZE (16384)
|
|
|
|
struct aclk_database_cmdqueue {
|
|
unsigned head, tail;
|
|
struct aclk_database_cmd cmd_array[ACLK_DATABASE_CMD_Q_MAX_SIZE];
|
|
};
|
|
|
|
struct aclk_database_worker_config {
|
|
uv_thread_t thread;
|
|
char uuid_str[GUID_LEN + 1];
|
|
char node_id[GUID_LEN + 1];
|
|
char host_guid[GUID_LEN + 1];
|
|
char *hostname; // hostname to avoid constant lookups
|
|
uint64_t chart_sequence_id; // last chart_sequence_id
|
|
time_t chart_timestamp; // last chart timestamp
|
|
time_t cleanup_after; // Start a cleanup after this timestamp
|
|
time_t startup_time; // When the sync thread started
|
|
time_t rotation_after;
|
|
uint64_t batch_id; // batch id to use
|
|
uint64_t alerts_batch_id; // batch id for alerts to use
|
|
uint64_t alerts_start_seq_id; // cloud has asked to start streaming from
|
|
uint64_t alert_sequence_id; // last alert sequence_id
|
|
int pause_alert_updates;
|
|
uint32_t chart_payload_count;
|
|
uint64_t alerts_snapshot_id; //will contain the snapshot_id value if snapshot was requested
|
|
uint64_t alerts_ack_sequence_id; //last sequence_id ack'ed from cloud via sendsnapshot message
|
|
uv_loop_t *loop;
|
|
RRDHOST *host;
|
|
uv_async_t async;
|
|
/* FIFO command queue */
|
|
uv_mutex_t cmd_mutex;
|
|
uv_cond_t cmd_cond;
|
|
volatile unsigned queue_size;
|
|
struct aclk_database_cmdqueue cmd_queue;
|
|
uint32_t retry_count;
|
|
int chart_updates;
|
|
int alert_updates;
|
|
time_t batch_created;
|
|
int node_info_send;
|
|
time_t node_collectors_send;
|
|
int chart_pending;
|
|
int chart_reset_count;
|
|
int retention_running;
|
|
volatile unsigned is_shutting_down;
|
|
volatile unsigned is_orphan;
|
|
struct aclk_database_worker_config *next;
|
|
};
|
|
|
|
static inline RRDHOST *find_host_by_node_id(char *node_id)
|
|
{
|
|
uuid_t node_uuid;
|
|
if (unlikely(!node_id))
|
|
return NULL;
|
|
|
|
if (uuid_parse(node_id, node_uuid))
|
|
return NULL;
|
|
|
|
rrd_rdlock();
|
|
RRDHOST *host, *ret = NULL;
|
|
rrdhost_foreach_read(host) {
|
|
if (host->node_id && !(uuid_compare(*host->node_id, node_uuid))) {
|
|
ret = host;
|
|
break;
|
|
}
|
|
}
|
|
rrd_unlock();
|
|
|
|
return ret;
|
|
}
|
|
|
|
|
|
extern sqlite3 *db_meta;
|
|
|
|
extern int aclk_database_enq_cmd_noblock(struct aclk_database_worker_config *wc, struct aclk_database_cmd *cmd);
|
|
extern void aclk_database_enq_cmd(struct aclk_database_worker_config *wc, struct aclk_database_cmd *cmd);
|
|
extern void sql_create_aclk_table(RRDHOST *host, uuid_t *host_uuid, uuid_t *node_id);
|
|
int aclk_worker_enq_cmd(char *node_id, struct aclk_database_cmd *cmd);
|
|
void aclk_data_rotated(void);
|
|
void sql_aclk_sync_init(void);
|
|
void sql_check_aclk_table_list(struct aclk_database_worker_config *wc);
|
|
void sql_delete_aclk_table_list(struct aclk_database_worker_config *wc, struct aclk_database_cmd cmd);
|
|
void sql_maint_aclk_sync_database(struct aclk_database_worker_config *wc, struct aclk_database_cmd cmd);
|
|
int claimed();
|
|
void aclk_sync_exit_all();
|
|
struct aclk_database_worker_config *find_inactive_wc_by_node_id(char *node_id);
|
|
#endif //NETDATA_SQLITE_ACLK_H
|