mirror of
https://github.com/ntop/ntopng.git
synced 2026-04-30 07:59:35 +00:00
1265 lines
37 KiB
Lua
1265 lines
37 KiB
Lua
--
|
|
-- (C) 2020 - ntop.org
|
|
--
|
|
|
|
local driver = {}
|
|
|
|
local os_utils = require("os_utils")
|
|
local ts_common = require("ts_common")
|
|
local data_retention_utils = require "data_retention_utils"
|
|
local json = require("dkjson")
|
|
|
|
require("rrd_paths")
|
|
|
|
local use_hwpredict = false
|
|
local use_rrd_queue = true
|
|
|
|
local type_to_rrdtype = {
|
|
[ts_common.metrics.counter] = "DERIVE",
|
|
[ts_common.metrics.gauge] = "GAUGE",
|
|
}
|
|
|
|
local aggregation_to_consolidation = {
|
|
[ts_common.aggregation.mean] = "AVERAGE",
|
|
[ts_common.aggregation.max] = "MAX",
|
|
[ts_common.aggregation.min] = "MIN",
|
|
[ts_common.aggregation.last] = "LAST",
|
|
}
|
|
|
|
-- ##############################################
|
|
|
|
local debug_enabled = nil
|
|
local function isDebugEnabled()
|
|
if debug_enabled == nil then
|
|
-- cache it
|
|
debug_enabled = (ntop.getPref("ntopng.prefs.rrd_debug_enabled") == "1")
|
|
end
|
|
|
|
return(debug_enabled)
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
function driver:new(options)
|
|
local obj = {
|
|
base_path = options.base_path,
|
|
}
|
|
|
|
setmetatable(obj, self)
|
|
self.__index = self
|
|
|
|
return obj
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
function driver:getLatestTimestamp(ifid)
|
|
return os.time()
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
-- Maps second tag name to getRRDName
|
|
local HOST_PREFIX_MAP = {
|
|
host = "",
|
|
mac = "",
|
|
subnet = "net:",
|
|
flowdev_port = "flow_device:",
|
|
sflowdev_port = "sflow:",
|
|
snmp_if = "snmp:",
|
|
host_pool = "pool:",
|
|
}
|
|
local WILDCARD_TAGS = {protocol=1, category=1, l4proto=1, dscp_class=1}
|
|
|
|
local function get_fname_for_schema(schema, tags)
|
|
if schema.options.rrd_fname ~= nil then
|
|
return schema.options.rrd_fname
|
|
end
|
|
|
|
local last_tag = schema._tags[#schema._tags]
|
|
|
|
if WILDCARD_TAGS[last_tag] then
|
|
-- return the last defined tag
|
|
return tags[last_tag]
|
|
end
|
|
|
|
-- e.g. host:contacts -> contacts
|
|
local suffix = string.split(schema.name, ":")[2]
|
|
return suffix
|
|
end
|
|
|
|
local function schema_get_path(schema, tags)
|
|
local parts = {schema.name, }
|
|
local suffix = ""
|
|
local rrd
|
|
|
|
-- ifid is mandatory here
|
|
local ifid = tags.ifid or -1
|
|
local host_or_network = nil
|
|
local parts = string.split(schema.name, ":")
|
|
|
|
if((string.find(schema.name, "iface:") ~= 1) and -- interfaces are only identified by the first tag
|
|
(#schema._tags >= 1)) then -- some schema do not have any tag, e.g. "process:*" schemas
|
|
local prefix = HOST_PREFIX_MAP[parts[1]] or (parts[1] .. ":")
|
|
local suffix = tags[schema._tags[2] or schema._tags[1]] or tags[schema._tags[1]]
|
|
|
|
if(suffix ~= ifid) then
|
|
host_or_network = prefix .. suffix
|
|
else
|
|
-- Avoid repeating the ifid suffix in the path
|
|
host_or_network = prefix .. ""
|
|
end
|
|
end
|
|
|
|
-- Some exceptions to avoid conflicts / keep compatibility
|
|
if parts[1] == "snmp_if" then
|
|
suffix = tags.if_index .. "/"
|
|
elseif (parts[1] == "flowdev_port") or (parts[1] == "sflowdev_port") then
|
|
suffix = tags.port .. "/"
|
|
elseif parts[2] == "ndpi_categories" then
|
|
suffix = "ndpi_categories/"
|
|
elseif parts[2] == "ndpi_flows" then
|
|
suffix = "ndpi_flows/"
|
|
elseif parts[2] == "l4protos" then
|
|
suffix = "l4protos/"
|
|
elseif parts[2] == "dscp" then
|
|
suffix = "dscp/"
|
|
elseif #schema._tags >= 3 then
|
|
local intermediate_tags = {}
|
|
|
|
-- tag1:ifid
|
|
-- tag2:already handled as host_or_network
|
|
-- last tag must be handled separately
|
|
for i=3, #schema._tags-1 do
|
|
intermediate_tags[#intermediate_tags + 1] = tags[schema._tags[i]]
|
|
end
|
|
|
|
local last_tag = schema._tags[#schema._tags]
|
|
|
|
if(not WILDCARD_TAGS[last_tag]) then
|
|
intermediate_tags[#intermediate_tags + 1] = tags[last_tag]
|
|
end
|
|
|
|
if intermediate_tags[1] ~= nil then
|
|
-- All the intermediate tags should be mapped in the path
|
|
suffix = table.concat(intermediate_tags, "/") .. "/"
|
|
end
|
|
end
|
|
|
|
local path = getRRDName(ifid, host_or_network) .. suffix
|
|
local rrd = get_fname_for_schema(schema, tags)
|
|
|
|
return path, rrd
|
|
end
|
|
|
|
function driver.schema_get_full_path(schema, tags)
|
|
local base, rrd = schema_get_path(schema, tags)
|
|
|
|
if((not base) or (not rrd)) then
|
|
return nil
|
|
end
|
|
|
|
local full_path = os_utils.fixPath(base .. "/" .. rrd .. ".rrd")
|
|
|
|
return full_path
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
local function getRRAParameters(step, resolution, retention_time)
|
|
local aggregation_dp = math.ceil(resolution / step)
|
|
local retention_dp = math.ceil(retention_time / resolution)
|
|
return aggregation_dp, retention_dp
|
|
end
|
|
|
|
-- This is necessary to keep the current RRD format
|
|
local function map_metrics_to_rrd_columns(num)
|
|
if num == 1 then
|
|
return {"num"}
|
|
elseif num == 2 then
|
|
return {"sent", "rcvd"}
|
|
elseif num == 3 then
|
|
return {"ingress", "egress", "inner"}
|
|
elseif num == 4 then
|
|
return {"ingress", "egress", "inner", "other"}
|
|
end
|
|
|
|
-- error
|
|
return nil
|
|
end
|
|
|
|
-- This is necessary to keep the current RRD format
|
|
local function map_rrd_column_to_metrics(schema, column_name)
|
|
if (column_name == "num") or starts(column_name, "num_")
|
|
or (column_name == "drops") or starts(column_name, "tcp_")
|
|
or (column_name == "sent") or (column_name == "ingress")
|
|
or (column_name == "bytes") or (column_name == "packets")
|
|
then
|
|
return 1
|
|
elseif (column_name == "rcvd") or (column_name == "egress") then
|
|
return 2
|
|
elseif (column_name == "inner") then
|
|
return 3
|
|
end
|
|
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, "unknown column name (" .. column_name .. ") in schema " .. schema.name)
|
|
return nil
|
|
end
|
|
|
|
local function getConsolidationFunction(schema)
|
|
local fn = schema:getAggregationFunction()
|
|
|
|
if(aggregation_to_consolidation[fn] ~= nil) then
|
|
return(aggregation_to_consolidation[fn])
|
|
end
|
|
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, "unknown aggregation function: %s", fn)
|
|
|
|
return("AVERAGE")
|
|
end
|
|
|
|
local function create_rrd(schema, path, timestamp)
|
|
local heartbeat = schema.options.rrd_heartbeat or (schema.options.insertion_step * 2)
|
|
local rrd_type = type_to_rrdtype[schema.options.metrics_type]
|
|
local params = {path, schema.options.insertion_step}
|
|
local cf = getConsolidationFunction(schema)
|
|
|
|
if(timestamp ~= nil) then
|
|
-- RRD start time (--start/-b)
|
|
-- It must be tuned so that the first point of the chart in the subsequent
|
|
-- rrd_update will not be discarded
|
|
params[#params + 1] = timestamp - schema.options.insertion_step
|
|
end
|
|
|
|
local metrics_map = map_metrics_to_rrd_columns(#schema._metrics)
|
|
if not metrics_map then
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, "unsupported number of metrics (" .. (#schema._metrics) .. ") in schema " .. schema.name)
|
|
return false
|
|
end
|
|
|
|
for idx, metric in ipairs(schema._metrics) do
|
|
params[#params + 1] = "DS:" .. metrics_map[idx] .. ":" .. rrd_type .. ':' .. heartbeat .. ':U:U'
|
|
end
|
|
|
|
for _, rra in ipairs(schema.retention) do
|
|
params[#params + 1] = "RRA:" .. cf .. ":0.5:" .. rra.aggregation_dp .. ":" .. rra.retention_dp
|
|
end
|
|
|
|
if use_hwpredict and schema.hwpredict then
|
|
-- NOTE: at most one RRA, otherwise rrd_update crashes.
|
|
local hwpredict = schema.hwpredict
|
|
params[#params + 1] = "RRA:HWPREDICT:" .. hwpredict.row_count .. ":0.1:0.0035:" .. hwpredict.period
|
|
end
|
|
|
|
if isDebugEnabled() then
|
|
traceError(TRACE_NORMAL, TRACE_CONSOLE, string.format("ntop.rrd_create(%s) schema=%s",
|
|
table.concat(params, ", "), schema.name))
|
|
end
|
|
|
|
local err = ntop.rrd_create(table.unpack(params))
|
|
if(err ~= nil) then
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, err)
|
|
return false
|
|
end
|
|
|
|
return true
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
local function handle_old_rrd_tune(schema, rrdfile, timestamp)
|
|
-- In this case the only thing we can do is to remove the file and create a new one
|
|
if ntop.getCache("ntopng.cache.rrd_format_change_warning_shown") ~= "1" then
|
|
traceError(TRACE_WARNING, TRACE_CONSOLE, "RRD format change detected, incompatible RRDs will be moved to '.rrd.bak' files")
|
|
ntop.setCache("ntopng.cache.rrd_format_change_warning_shown", "1")
|
|
end
|
|
|
|
os.rename(rrdfile, rrdfile .. ".bak")
|
|
|
|
if(not create_rrd(schema, rrdfile, timestamp)) then
|
|
return false
|
|
end
|
|
|
|
return true
|
|
end
|
|
|
|
local function add_missing_ds(schema, rrdfile, cur_ds, timestamp)
|
|
local cur_metrics = map_metrics_to_rrd_columns(cur_ds)
|
|
local new_metrics = map_metrics_to_rrd_columns(#schema._metrics)
|
|
|
|
if((cur_metrics == nil) or (new_metrics == nil)) then
|
|
return false
|
|
end
|
|
|
|
if cur_ds >= #new_metrics then
|
|
return false
|
|
end
|
|
|
|
traceError(TRACE_INFO, TRACE_CONSOLE, "RRD format changed [schema=".. schema.name .."], trying to fix " .. rrdfile)
|
|
|
|
local params = {rrdfile, }
|
|
local heartbeat = schema.options.rrd_heartbeat or (schema.options.insertion_step * 2)
|
|
local rrd_type = type_to_rrdtype[schema.options.metrics_type]
|
|
|
|
for idx, metric in ipairs(schema._metrics) do
|
|
local old_name = cur_metrics[idx]
|
|
local new_name = new_metrics[idx]
|
|
|
|
if old_name == nil then
|
|
params[#params + 1] = "DS:" .. new_name .. ":" .. rrd_type .. ':' .. heartbeat .. ':U:U'
|
|
elseif old_name ~= new_name then
|
|
params[#params + 1] = "--data-source-rename"
|
|
params[#params + 1] = old_name ..":" .. new_name
|
|
end
|
|
end
|
|
|
|
local err = ntop.rrd_tune(table.unpack(params))
|
|
if(err ~= nil) then
|
|
if(string.find(err, "unknown data source name") ~= nil) then
|
|
-- the RRD was already mangled by incompatible rrd_tune
|
|
return handle_old_rrd_tune(schema, rrdfile, timestamp)
|
|
else
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, err)
|
|
return false
|
|
end
|
|
end
|
|
|
|
-- Double check as some older implementations do not support adding a column and will silently fail
|
|
local last_update, num_ds = ntop.rrd_lastupdate(rrdfile)
|
|
if num_ds ~= #new_metrics then
|
|
return handle_old_rrd_tune(schema, rrdfile, timestamp)
|
|
end
|
|
|
|
traceError(TRACE_INFO, TRACE_CONSOLE, "RRD successfully fixed: " .. rrdfile)
|
|
return true
|
|
end
|
|
|
|
-- ###############################################
|
|
|
|
-- Converts a number (either decimal or integer) to a string
|
|
-- in a format which is friendly for the subsequent call to rrd_update
|
|
local function number_to_rrd_string(what)
|
|
what = tonumber(what)
|
|
|
|
if(what == nil) then
|
|
return("0")
|
|
elseif(type(what) ~= "number") then
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, "number_to_rrd_string got a non-number argument: " .. type(what))
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, debug.traceback())
|
|
return("0")
|
|
elseif(what ~= what) then
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, "Trying to convert NaN to integer")
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, debug.traceback())
|
|
return("0")
|
|
elseif(what == math.huge) then
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, "Trying to convert inf to integer")
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, debug.traceback())
|
|
return("0")
|
|
elseif((what >= math.maxinteger) or (what <= math.mininteger)) then
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, "Number out of integers range: " .. what)
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, debug.traceback())
|
|
return("0")
|
|
elseif what == math.floor(what) then
|
|
-- If the number has no decimal place, print it as a digit
|
|
return(string.format("%d", what))
|
|
else
|
|
-- If the number has decimal places, print it as a float
|
|
-- (don't touch the precision, let's the rrd do this job if necessary)
|
|
return(string.format("%f", what))
|
|
end
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
local function update_rrd(schema, rrdfile, timestamp, data, dont_recover)
|
|
local params = { number_to_rrd_string(timestamp), }
|
|
|
|
if isDebugEnabled() then
|
|
traceError(TRACE_NORMAL, TRACE_CONSOLE, string.format("Going to update %s [%s]", schema.name, rrdfile))
|
|
end
|
|
|
|
-- Verify last update time
|
|
local last_update = ntop.rrd_lastupdate(rrdfile)
|
|
|
|
if((last_update ~= nil) and (timestamp <= last_update)) then
|
|
if isDebugEnabled() then
|
|
traceError(TRACE_NORMAL, TRACE_CONSOLE,
|
|
string.format("Skip RRD update in the past: timestamp=%u but last_update=%u",
|
|
timestamp, last_update))
|
|
end
|
|
|
|
return false
|
|
end
|
|
|
|
for _, metric in ipairs(schema._metrics) do
|
|
params[#params + 1] = number_to_rrd_string(data[metric])
|
|
end
|
|
|
|
if isDebugEnabled() then
|
|
traceError(TRACE_NORMAL, TRACE_CONSOLE, string.format("ntop.rrd_update(%s, %s) schema=%s",
|
|
rrdfile, table.concat(params, ", "), schema.name))
|
|
end
|
|
|
|
local err = ntop.rrd_update(rrdfile, table.unpack(params))
|
|
if(err ~= nil) then
|
|
if(dont_recover ~= true) then
|
|
-- Try to recover
|
|
local last_update, num_ds = ntop.rrd_lastupdate(rrdfile)
|
|
local retry = false
|
|
|
|
if((num_ds ~= nil) and (num_ds < #schema._metrics)) then
|
|
if add_missing_ds(schema, rrdfile, num_ds, timestamp) then
|
|
retry = true
|
|
end
|
|
elseif((num_ds == 2) and (schema.name == "iface:traffic")) then
|
|
-- The RRD is corrupted due to collision between "iface:traffic" and "evexporter_iface:traffic"
|
|
traceError(TRACE_WARNING, TRACE_CONSOLE, "'evexporter_iface:traffic' schema collision detected on " .. rrdfile .. ", moving RRD to .old")
|
|
local rv, errmsg = os.rename(rrdfile, rrdfile..".old")
|
|
|
|
if(rv == nil) then
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, errmsg)
|
|
return false
|
|
end
|
|
|
|
if(not create_rrd(schema, rrdfile, timestamp)) then
|
|
return false
|
|
end
|
|
|
|
retry = true
|
|
end
|
|
|
|
if retry then
|
|
-- Problem possibly fixed, retry
|
|
return update_rrd(schema, rrdfile, timestamp, data, true --[[ do not recovery again ]])
|
|
end
|
|
end
|
|
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, err)
|
|
return false
|
|
end
|
|
|
|
return true
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
local function ts2json(rrdfile, schema, timestamp, tags, metrics)
|
|
local what = { }
|
|
local j
|
|
|
|
what.file = rrdfile
|
|
what.params = { number_to_rrd_string(timestamp) }
|
|
|
|
for _, metric in ipairs(schema._metrics) do
|
|
what.params[#params + 1] = number_to_rrd_string(metrics[metric])
|
|
end
|
|
|
|
return(json.encode(what))
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
local function log_ts(rrdfile, schema, timestamp, tags, metrics)
|
|
local j = ts2json(rrdfile, schema, timestamp, tags, metrics)
|
|
|
|
if(schema.options.is_critical_ts) then
|
|
critical = "[Critical]"
|
|
else
|
|
critical = ""
|
|
end
|
|
|
|
io.write("[RRD]"..critical.."[Step: ".. schema.options.step .."]["..j.."]\n")
|
|
|
|
return(j)
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
function driver:append(schema, timestamp, tags, metrics)
|
|
local base, rrd = schema_get_path(schema, tags)
|
|
local rrdfile = os_utils.fixPath(base .. "/" .. rrd .. ".rrd")
|
|
|
|
if use_rrd_queue then
|
|
if not schema.options.is_critical_ts then
|
|
local res = interface.rrd_enqueue(schema.name, timestamp, tags, metrics)
|
|
|
|
if not res then
|
|
ntop.rrd_inc_num_drops()
|
|
end
|
|
|
|
return res
|
|
end
|
|
end
|
|
|
|
if not ntop.notEmptyFile(rrdfile) then
|
|
ntop.mkdir(base)
|
|
if not create_rrd(schema, rrdfile, timestamp) then
|
|
return false
|
|
end
|
|
end
|
|
|
|
return update_rrd(schema, rrdfile, timestamp, metrics)
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
local function makeTotalSerie(series, count)
|
|
local total = {}
|
|
local nan = 0/0
|
|
|
|
for i=1, count do
|
|
total[i] = nan
|
|
end
|
|
|
|
for _, serie in pairs(series) do
|
|
for i, val in pairs(serie.data) do
|
|
local old_v = total[i]
|
|
local old_is_nan = (old_v ~= old_v)
|
|
local val_is_nan = (val ~= val)
|
|
|
|
if(old_is_nan and (not val_is_nan)) then
|
|
-- Avoid NaN sum
|
|
total[i] = val
|
|
elseif((not old_is_nan) and val_is_nan) then
|
|
-- Avoid NaN sum
|
|
total[i] = old_v
|
|
else
|
|
-- Both are NaN / non NaN
|
|
total[i] = old_v + val
|
|
end
|
|
end
|
|
end
|
|
|
|
return total
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
local function sampleSeries(schema, cur_points, step, max_points, series)
|
|
local sampled_dp = math.ceil(cur_points / max_points)
|
|
local count = nil
|
|
local nan = 0/0
|
|
|
|
for _, data_serie in pairs(series) do
|
|
local serie = data_serie.data
|
|
local num = 0
|
|
local sum = 0
|
|
local all_nan = true
|
|
local end_idx = 1
|
|
|
|
for idx, dp in ipairs(serie) do
|
|
if(dp ~= dp) then
|
|
-- Convert NaN to 0 to calculate the sums
|
|
dp = 0
|
|
else
|
|
all_nan = false
|
|
end
|
|
|
|
sum = sum + dp
|
|
num = num + 1
|
|
|
|
if num == sampled_dp then
|
|
-- A data group is ready
|
|
if all_nan then
|
|
-- If all the points into the datagroup are NaN, calculate them
|
|
-- as NaN
|
|
sum = nan
|
|
end
|
|
|
|
serie[end_idx] = sum / num
|
|
end_idx = end_idx + 1
|
|
|
|
num = 0
|
|
sum = 0
|
|
all_nan = true
|
|
end
|
|
end
|
|
|
|
-- Last group
|
|
if num > 0 then
|
|
if all_nan then
|
|
sum = nan
|
|
end
|
|
|
|
serie[end_idx] = sum / num
|
|
end_idx = end_idx + 1
|
|
end
|
|
|
|
count = end_idx-1
|
|
|
|
-- remove the exceeding points
|
|
for i = end_idx, #serie do
|
|
serie[i] = nil
|
|
end
|
|
end
|
|
|
|
-- new step, new count, new data
|
|
return step * sampled_dp, count
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
-- Make sure we do not fetch data from RRDs that have been update too much long ago
|
|
-- as this creates issues with the consolidation functions when we want to compare
|
|
-- results coming from different RRDs.
|
|
-- This is also needed to make sure that multiple data series on graphs have the
|
|
-- same number of points, otherwise d3js will generate errors.
|
|
local function touchRRD(rrdname)
|
|
local now = os.time()
|
|
local last, ds_count = ntop.rrd_lastupdate(rrdname)
|
|
|
|
if((last ~= nil) and ((now-last) > 3600)) then
|
|
local tdiff = now - 1800 -- This avoids to set the update continuously
|
|
|
|
if isDebugEnabled() then
|
|
traceError(TRACE_NORMAL, TRACE_CONSOLE, string.format("touchRRD(%s, %u), last_update was %u",
|
|
rrdname, tdiff, last))
|
|
end
|
|
|
|
if(ds_count == 1) then
|
|
ntop.rrd_update(rrdname, tdiff.."", "0")
|
|
elseif(ds_count == 2) then
|
|
ntop.rrd_update(rrdname, tdiff.."", "0", "0")
|
|
elseif(ds_count == 3) then
|
|
ntop.rrd_update(rrdname, tdiff.."", "0", "0", "0")
|
|
elseif(ds_count == 4) then
|
|
ntop.rrd_update(rrdname, tdiff.."", "0", "0", "0", "0")
|
|
end
|
|
end
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
function driver:query(schema, tstart, tend, tags, options)
|
|
local base, rrd = schema_get_path(schema, tags)
|
|
local rrdfile = os_utils.fixPath(base .. "/" .. rrd .. ".rrd")
|
|
|
|
if not ntop.notEmptyFile(rrdfile) then
|
|
return nil
|
|
end
|
|
|
|
touchRRD(rrdfile)
|
|
|
|
local last_update = ntop.rrd_lastupdate(rrdfile)
|
|
|
|
if isDebugEnabled() then
|
|
traceError(TRACE_NORMAL, TRACE_CONSOLE, string.format("RRD_FETCH schema=%s %s -> (%s): last_update=%u",
|
|
schema.name, table.tconcat(tags, "=", ","), rrdfile, last_update))
|
|
end
|
|
|
|
-- Avoid reporting the last point when the timeseries write has not completed
|
|
-- yet. Use 2*step as a bound.
|
|
if((tend > last_update) and ((tend - last_update) <= 2*schema.options.step)) then
|
|
tend = last_update
|
|
end
|
|
|
|
--tprint("rrdtool fetch ".. rrdfile.. " " .. getConsolidationFunction(schema) .. " -s ".. tstart .. " -e " .. tend)
|
|
local fstart, fstep, fdata, fend, fcount = ntop.rrd_fetch_columns(rrdfile, getConsolidationFunction(schema), tstart, tend)
|
|
|
|
if fdata == nil then
|
|
return nil
|
|
end
|
|
|
|
local count = 0
|
|
local series = {}
|
|
|
|
for name_key, serie in pairs(fdata) do
|
|
local serie_idx = map_rrd_column_to_metrics(schema, name_key)
|
|
local name = schema._metrics[serie_idx]
|
|
local max_val = ts_common.getMaxPointValue(schema, name, tags)
|
|
count = 0
|
|
|
|
-- unify the format
|
|
for i, v in pairs(serie) do
|
|
local v = ts_common.normalizeVal(v, max_val, options)
|
|
serie[i] = v
|
|
count = count + 1
|
|
end
|
|
|
|
-- Remove the last value: RRD seems to give an additional point
|
|
serie[#serie] = nil
|
|
count = count - 1
|
|
|
|
series[serie_idx] = {label=name, data=serie}
|
|
|
|
serie_idx = serie_idx + 1
|
|
end
|
|
|
|
-- table.clone needed as series can be modified below (sampleSeries works on it in-place)
|
|
local unsampled_series = table.clone(series)
|
|
local unsampled_count = count
|
|
local unsampled_fstep = fstep
|
|
|
|
if count > options.max_num_points then
|
|
fstep, count = sampleSeries(schema, count, fstep, options.max_num_points, series)
|
|
end
|
|
|
|
--local returned_tend = fstart + fstep * (count-1)
|
|
--tprint(returned_tend .. " " .. fstart)
|
|
|
|
local total_serie = nil
|
|
local stats = nil
|
|
|
|
if options.calculate_stats then
|
|
total_serie = makeTotalSerie(series, count)
|
|
stats = ts_common.calculateStatistics(makeTotalSerie(unsampled_series, unsampled_count), unsampled_fstep, tend - tstart, schema.options.metrics_type)
|
|
stats = stats or {}
|
|
stats.by_serie = {}
|
|
|
|
-- Also calculate per-serie statistics
|
|
for k, v in pairs(series) do
|
|
local s = ts_common.calculateStatistics(v.data, unsampled_fstep, tend - tstart, schema.options.metrics_type)
|
|
stats.by_serie[k] = s
|
|
end
|
|
end
|
|
|
|
if options.initial_point then
|
|
local _, _, initial_pt = ntop.rrd_fetch_columns(rrdfile, getConsolidationFunction(schema), tstart-schema.options.step, tstart-schema.options.step)
|
|
initial_pt = initial_pt or {}
|
|
|
|
for name_key, values in pairs(initial_pt) do
|
|
local serie_idx = map_rrd_column_to_metrics(schema, name_key)
|
|
local name = schema._metrics[serie_idx]
|
|
local max_val = ts_common.getMaxPointValue(schema, name, tags)
|
|
local ptval = ts_common.normalizeVal(values[1], max_val, options)
|
|
|
|
table.insert(series[serie_idx].data, 1, ptval)
|
|
end
|
|
|
|
count = count + 1
|
|
|
|
if total_serie then
|
|
-- recalculate with additional point
|
|
total_serie = makeTotalSerie(series, count)
|
|
end
|
|
end
|
|
|
|
if options.calculate_stats then
|
|
stats = table.merge(stats, ts_common.calculateMinMax(total_serie))
|
|
end
|
|
|
|
return {
|
|
start = fstart,
|
|
step = fstep,
|
|
count = count,
|
|
series = series,
|
|
statistics = stats,
|
|
additional_series = {
|
|
total = total_serie,
|
|
},
|
|
}
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
-- *Limitation*
|
|
-- tags_filter is expected to contain all the tags of the schema except the last
|
|
-- one. For such tag, a list of available values will be returned.
|
|
function driver:listSeries(schema, tags_filter, wildcard_tags, start_time)
|
|
if #wildcard_tags > 1 then
|
|
tprint({schema_name = schema.name, wildcards=wildcard_tags})
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, "RRD driver does not support listSeries on multiple tags")
|
|
return nil
|
|
end
|
|
|
|
local wildcard_tag = wildcard_tags[1]
|
|
|
|
if not wildcard_tag then
|
|
local full_path = driver.schema_get_full_path(schema, tags_filter)
|
|
local last_update = ntop.rrd_lastupdate(full_path)
|
|
|
|
if last_update ~= nil and last_update >= start_time then
|
|
return {tags_filter}
|
|
else
|
|
return nil
|
|
end
|
|
end
|
|
|
|
if wildcard_tag ~= schema._tags[#schema._tags] then
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, "RRD driver only support listSeries with wildcard in the last tag, got wildcard on '" .. wildcard_tag .. "'")
|
|
return nil
|
|
end
|
|
|
|
local base, rrd = schema_get_path(schema, table.merge(tags_filter, {[wildcard_tag] = ""}))
|
|
local files = ntop.readdir(base)
|
|
local res = {}
|
|
|
|
for f in pairs(files or {}) do
|
|
local v = string.split(f, "%.rrd")
|
|
local fpath = base .. "/" .. f
|
|
|
|
if((v ~= nil) and (#v == 1)) then
|
|
local last_update = ntop.rrd_lastupdate(fpath)
|
|
|
|
if last_update ~= nil and last_update >= start_time then
|
|
local value = v[1]
|
|
local toadd = false
|
|
|
|
if wildcard_tag == "if_index" then
|
|
-- NOTE: needed to add this crazy exception. Don't now what it is
|
|
-- but it's needed, otherwise this function is tricked into thinking
|
|
-- other timeseries (such as snmp_dev:cpu_states) are if_index
|
|
--
|
|
-- This is what we get:
|
|
-- 1.device string 192.168.2.1
|
|
-- 1.ifid string -1
|
|
-- 1.if_index string 5
|
|
-- 2 table
|
|
-- 2.device string 192.168.2.1
|
|
-- 2.ifid string -1
|
|
-- 2.if_index string 2
|
|
-- 3 table
|
|
-- 3.device string 192.168.2.1
|
|
-- 3.ifid string -1
|
|
-- 3.if_index string cpu_states <<<<<<<<<<<<<<<<< don't know why this happens to be here
|
|
-- 4 table
|
|
--
|
|
if tonumber(value) then
|
|
toadd = true
|
|
end
|
|
elseif wildcard_tag == "dscp_class" then
|
|
toadd = true
|
|
elseif wildcard_tag == "l4proto" then
|
|
if L4_PROTO_KEYS[value] ~= nil then
|
|
toadd = true
|
|
end
|
|
elseif ((wildcard_tag ~= "protocol") or ((L4_PROTO_KEYS[value] == nil) and (interface.getnDPIProtoId(value) ~= -1))) and
|
|
((wildcard_tag ~= "category") or (interface.getnDPICategoryId(value) ~= -1)) then
|
|
toadd = true
|
|
end
|
|
|
|
if toadd then
|
|
res[#res + 1] = table.merge(tags_filter, {[wildcard_tag] = value})
|
|
end
|
|
end
|
|
elseif ntop.isdir(fpath) then
|
|
fpath = fpath .. "/" .. rrd .. ".rrd"
|
|
|
|
local last_update = ntop.rrd_lastupdate(fpath)
|
|
|
|
if last_update ~= nil and last_update >= start_time then
|
|
res[#res + 1] = table.merge(tags_filter, {[wildcard_tag] = f})
|
|
end
|
|
end
|
|
end
|
|
|
|
return res
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
function driver:topk(schema, tags, tstart, tend, options, top_tags)
|
|
if #top_tags > 1 then
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, "RRD driver does not support topk on multiple tags")
|
|
return nil
|
|
end
|
|
|
|
local top_tag = top_tags[1]
|
|
|
|
if top_tag ~= schema._tags[#schema._tags] then
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, "RRD driver only support topk with topk tag in the last tag, got topk on '" .. (top_tag or "") .. "'")
|
|
return nil
|
|
end
|
|
|
|
local series = driver:listSeries(schema, tags, top_tags, tstart)
|
|
if not series then
|
|
return nil
|
|
end
|
|
|
|
local items = {}
|
|
local tag_2_series = {}
|
|
local total_serie = {}
|
|
local total_valid = true
|
|
local step = 0
|
|
local query_start = tstart
|
|
local cf = getConsolidationFunction(schema)
|
|
|
|
if options.initial_point then
|
|
query_start = tstart - schema.options.step
|
|
end
|
|
|
|
for _, serie_tags in pairs(series) do
|
|
local rrdfile = driver.schema_get_full_path(schema, serie_tags)
|
|
|
|
if isDebugEnabled() then
|
|
traceError(TRACE_NORMAL, TRACE_CONSOLE, string.format("RRD_FETCH[topk] schema=%s %s[%s] -> (%s): last_update=%u",
|
|
schema.name, table.tconcat(tags, "=", ","), table.concat(top_tags, ","), rrdfile, ntop.rrd_lastupdate(rrdfile)))
|
|
end
|
|
|
|
touchRRD(rrdfile)
|
|
|
|
local fstart, fstep, fdata, fend, fcount = ntop.rrd_fetch_columns(rrdfile, cf, query_start, tend)
|
|
local sum = 0
|
|
|
|
if fdata == nil then
|
|
goto continue
|
|
end
|
|
|
|
step = fstep
|
|
|
|
local partials = {}
|
|
|
|
for name_key, serie in pairs(fdata) do
|
|
local serie_idx = map_rrd_column_to_metrics(schema, name_key)
|
|
local name = schema._metrics[serie_idx]
|
|
local max_val = ts_common.getMaxPointValue(schema, name, serie_tags)
|
|
partials[name] = 0
|
|
|
|
-- Remove the last value: RRD seems to give an additional point
|
|
serie[#serie] = nil
|
|
|
|
if (#total_serie ~= 0) and #total_serie ~= #serie then
|
|
-- NOTE: even if touchRRD is used, series can still have a different number
|
|
-- of points when the tend parameter does not correspond to the current time
|
|
-- e.g. when comparing with the past or manually zooming.
|
|
-- In this case, total serie il discarded as it's incorrect
|
|
total_valid = false
|
|
end
|
|
|
|
for i=#total_serie + 1, #serie do
|
|
-- init
|
|
total_serie[i] = 0
|
|
end
|
|
|
|
for i, v in pairs(serie) do
|
|
local v = ts_common.normalizeVal(v, max_val, options)
|
|
|
|
if type(v) == "number" then
|
|
sum = sum + v
|
|
partials[name] = partials[name] + v * step
|
|
total_serie[i] = total_serie[i] + v
|
|
end
|
|
end
|
|
end
|
|
|
|
items[serie_tags[top_tag]] = sum * step
|
|
tag_2_series[serie_tags[top_tag]] = {serie_tags, partials}
|
|
::continue::
|
|
end
|
|
|
|
local topk = {}
|
|
|
|
for top_item, value in pairsByValues(items, rev) do
|
|
if value > 0 then
|
|
topk[#topk + 1] = {
|
|
tags = tag_2_series[top_item][1],
|
|
value = value,
|
|
partials = tag_2_series[top_item][2],
|
|
}
|
|
end
|
|
|
|
if #topk >= options.top then
|
|
break
|
|
end
|
|
end
|
|
|
|
local stats = nil
|
|
|
|
-- table.clone needed as augumented_total can be modified below (sampleSeries works on it in-place)
|
|
local augumented_total = table.clone(total_serie)
|
|
|
|
if options.initial_point and total_serie then
|
|
-- remove initial point to avoid stats calculation on it
|
|
table.remove(total_serie, 1)
|
|
end
|
|
|
|
local fstep, count = sampleSeries(schema, #augumented_total, step, options.max_num_points, {{data=augumented_total}})
|
|
|
|
if options.calculate_stats then
|
|
stats = ts_common.calculateStatistics(total_serie, step, tend - tstart, schema.options.metrics_type)
|
|
stats = table.merge(stats, ts_common.calculateMinMax(augumented_total))
|
|
end
|
|
|
|
if not total_valid then
|
|
total_serie = nil
|
|
augumented_total = nil
|
|
end
|
|
|
|
return {
|
|
topk = topk,
|
|
additional_series = {
|
|
total = augumented_total,
|
|
},
|
|
statistics = stats,
|
|
}
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
function driver:queryTotal(schema, tstart, tend, tags, options)
|
|
local rrdfile = driver.schema_get_full_path(schema, tags)
|
|
|
|
if not ntop.notEmptyFile(rrdfile) then
|
|
return nil
|
|
end
|
|
|
|
touchRRD(rrdfile)
|
|
|
|
local fstart, fstep, fdata, fend, fcount = ntop.rrd_fetch_columns(rrdfile, getConsolidationFunction(schema), tstart, tend)
|
|
local totals = {}
|
|
|
|
for name_key, serie in pairs(fdata or {}) do
|
|
local serie_idx = map_rrd_column_to_metrics(schema, name_key)
|
|
local name = schema._metrics[serie_idx]
|
|
local max_val = ts_common.getMaxPointValue(schema, name, tags)
|
|
local sum = 0
|
|
|
|
-- Remove the last value: RRD seems to give an additional point
|
|
serie[#serie] = nil
|
|
|
|
for i, v in pairs(serie) do
|
|
local v = ts_common.normalizeVal(v, max_val, options)
|
|
|
|
if type(v) == "number" then
|
|
sum = sum + v * fstep
|
|
end
|
|
end
|
|
|
|
totals[name] = sum
|
|
end
|
|
|
|
return totals
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
local function deleteAllData(ifid)
|
|
local paths = getRRDPaths()
|
|
|
|
for _, path in pairs(paths) do
|
|
local ifpath = os_utils.fixPath(dirs.workingdir .. "/" .. ifid .. "/".. path .."/")
|
|
local path_to_del = os_utils.fixPath(ifpath)
|
|
|
|
if ntop.exists(path_to_del) and not ntop.rmdir(path_to_del) then
|
|
return false
|
|
end
|
|
end
|
|
|
|
return true
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
function driver:delete(schema_prefix, tags)
|
|
if schema_prefix == "" then
|
|
-- Delete all data
|
|
return deleteAllData(tags.ifid)
|
|
end
|
|
|
|
-- In RRD we must determine the root path of a given entity (e.g. of an
|
|
-- host if schema_prefix is "host", of a network if schema_prefix is "subnet"
|
|
-- and so on). In order to do so, we list all the schemas starting with the
|
|
-- given prefix, then determine the shortest path to be deleted.
|
|
--
|
|
-- E.g. for ts_utils.delete("mac", {ifid=1, mac="11:22:33:44:55:66"})
|
|
-- we find the following paths:
|
|
-- - /var/lib/ntopng/-1/rrd/macs/11_22_33/44/55/66 (schema "mac:traffic")
|
|
-- - /var/lib/ntopng/-1/rrd/macs/11_22_33/44/55/66/ndpi_categories (schema "mac:ndpi_categories")
|
|
-- We delete the shortest ("/var/lib/ntopng/-1/rrd/macs/11_22_33/44/55/66") as it includes the other.
|
|
--
|
|
-- NOTE: this logic assumes that schemas are well defined, which
|
|
-- means that:
|
|
-- - The first tag is the "ifid" tag
|
|
-- - Tags are defined in order of cardinality, e.g. the "host" tag is
|
|
-- defined before the "protocol" tag
|
|
local ts_utils = require "ts_utils" -- required to get the schemas
|
|
local num_valorized_tags = table.len(tags)
|
|
local s_prefix = schema_prefix .. ""
|
|
|
|
if(num_valorized_tags < 1) then
|
|
traceError(TRACE_ERROR, TRACE_CONSOLE, "At least 1 tags must be specified for the delete operation")
|
|
return false
|
|
end
|
|
|
|
local found = nil
|
|
|
|
-- Iterate the entity schemas and find the shortest RRD directory path
|
|
for k, s in pairs(ts_utils.getLoadedSchemas()) do
|
|
if starts(k, s_prefix) then
|
|
local unreleted = false
|
|
|
|
-- Ensure that all the tags are valorized in order to avoid
|
|
-- deleting unrelated data
|
|
for k in pairs(tags) do
|
|
if(s.tags[k] == nil) then
|
|
-- Missing tag, this schema is possibly unrelated
|
|
unreleted = true
|
|
break
|
|
end
|
|
end
|
|
|
|
if(not unreleted) then
|
|
local check_tags = {}
|
|
|
|
-- Fill the missing tags with empty strings to account them as
|
|
-- possible shortest paths
|
|
for k in pairs(s.tags) do
|
|
check_tags[k] = tags[k] or ""
|
|
end
|
|
|
|
local path = schema_get_path(s, check_tags)
|
|
|
|
-- Choose the shortest string to pick the path that includes the others
|
|
if path and ((found == nil) or (string.len(path) < string.len(found))) then
|
|
found = path
|
|
end
|
|
end
|
|
end
|
|
end
|
|
|
|
if(not found) then
|
|
return false
|
|
end
|
|
|
|
local path_to_del = os_utils.fixPath(found)
|
|
|
|
if ntop.exists(path_to_del) and not ntop.rmdir(path_to_del) then
|
|
return false
|
|
end
|
|
|
|
if isDebugEnabled() then
|
|
traceError(TRACE_NORMAL, TRACE_CONSOLE, string.format("DELETE schema=%s, %s => %s",
|
|
schema_prefix, table.tconcat(tags, "=", ","), path_to_del))
|
|
end
|
|
|
|
return true
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
function driver:deleteOldData(ifid)
|
|
local paths = getRRDPaths()
|
|
local dirs = ntop.getDirs()
|
|
local retention_days = data_retention_utils.getDataRetentionDays()
|
|
|
|
for _, path in pairs(paths) do
|
|
local ifpath = os_utils.fixPath(dirs.workingdir .. "/" .. ifid .. "/".. path .."/")
|
|
local deadline = retention_days * 86400
|
|
|
|
if isDebugEnabled() then
|
|
traceError(TRACE_NORMAL, TRACE_CONSOLE, string.format("ntop.deleteOldRRDs(%s, %u)", ifpath, deadline))
|
|
end
|
|
|
|
ntop.deleteOldRRDs(ifpath, deadline)
|
|
end
|
|
|
|
return true
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
function driver:setup(ts_utils)
|
|
return true
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
-- Parses a line in line protocol format (https://docs.influxdata.com/influxdb/v1.7/write_protocols/line_protocol_tutorial/)
|
|
-- into tags and metrics
|
|
local function line_protocol_to_tags_and_metrics(protocol_line)
|
|
-- An example of line protocol is the following
|
|
--
|
|
-- weather,location=us-midwest temperature=82 1465839830100400200
|
|
-- | -------------------- -------------- |
|
|
-- | | | |
|
|
-- | | | |
|
|
-- +-----------+--------+-+---------+-+---------+
|
|
-- |measurement|,tag_set| |field_set| |timestamp|
|
|
-- +-----------+--------+-+---------+-+---------+
|
|
--
|
|
-- NOTE: no need to worry about possible spaces in the tag names. As we are using a regexp to parse
|
|
-- the line, and regexps are greedy, spaces in the tags won't be of any issue. Examples that are correctly parsed are:
|
|
--
|
|
-- local test_line2 = "iface:traffic_rxtx,ifid=0 bytes_sent=849500,bytes_rcvd=5134958 1583007829\n"
|
|
-- local test_line = "iface:traffic_rxtx,ifid=0,ndpi_category=My Category,ndpi_proto=Apple iTunes,host=1.2.3.4 bytes_sent=849500,bytes_rcvd=5134958 1583007829\n"
|
|
--
|
|
local measurement_and_tag_set, field_set, timestamp = protocol_line:match("(.+)%s(.+)%s(.+)\n")
|
|
|
|
local measurement
|
|
local tags = {}
|
|
local metrics = {}
|
|
|
|
-- Parse measurement and tags
|
|
local items = measurement_and_tag_set:split(",")
|
|
if not items then
|
|
-- no tag set, just the measurement
|
|
measurement = measurement_and_tag_set
|
|
else
|
|
-- measurement is at position 1, tags at positions 2+
|
|
measurement = items[1]
|
|
for i=2,#items do
|
|
local tag_items = items[i]:split("=")
|
|
if tag_items and #tag_items == 2 then
|
|
tags[tag_items[1]] = tonumber(tag_items[2]) or tag_items[2]
|
|
end
|
|
end
|
|
end
|
|
|
|
-- Parse metrics
|
|
local items = field_set:split(",")
|
|
if not items then
|
|
-- Just one metric
|
|
items = {field_set}
|
|
end
|
|
|
|
for i=1,#items do
|
|
local field_items = items[i]:split("=")
|
|
|
|
if field_items and #field_items == 2 then
|
|
metrics[field_items[1]] = tonumber(field_items[2]) or field_items[2]
|
|
end
|
|
end
|
|
|
|
local res = {schema_name = measurement, tags = tags, metrics = metrics, timestamp = tonumber(timestamp)}
|
|
|
|
return res
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
function driver:export()
|
|
if(not(use_rrd_queue)) then
|
|
return -- Nothing to do
|
|
end
|
|
|
|
local ts_utils = require "ts_utils" -- required to get the schema from the schema name
|
|
|
|
local available_interfaces = interface.getIfNames()
|
|
-- Add the system interface to the available interfaces
|
|
available_interfaces[getSystemInterfaceId()] = getSystemInterfaceName()
|
|
local rrd_queue_max_dequeues_per_interface = 8192
|
|
|
|
for cur_ifid, iface in pairs(available_interfaces) do
|
|
for cur_dequeue=1, rrd_queue_max_dequeues_per_interface do
|
|
local ts_point = interface.rrd_dequeue(tonumber(cur_ifid))
|
|
|
|
if not ts_point then
|
|
break
|
|
end
|
|
|
|
local parsed_ts_point = line_protocol_to_tags_and_metrics(ts_point)
|
|
|
|
-- No need to do sanity checks on the schema. This queue is 'private' and should
|
|
-- only be written with valid data already checked.
|
|
local schema = ts_utils.getSchema(parsed_ts_point["schema_name"])
|
|
local timestamp = parsed_ts_point["timestamp"]
|
|
local tags = parsed_ts_point["tags"]
|
|
local metrics = parsed_ts_point["metrics"]
|
|
local base, rrd = schema_get_path(schema, tags)
|
|
local rrdfile = os_utils.fixPath(base .. "/" .. rrd .. ".rrd")
|
|
|
|
if not ntop.notEmptyFile(rrdfile) then
|
|
ntop.mkdir(base)
|
|
if not create_rrd(schema, rrdfile, timestamp) then
|
|
return false
|
|
end
|
|
end
|
|
|
|
update_rrd(schema, rrdfile, timestamp, metrics)
|
|
end
|
|
end
|
|
end
|
|
|
|
-- ##############################################
|
|
|
|
return driver
|