mirror of
https://github.com/zeek/zeek.git
synced 2025-10-02 14:48:21 +00:00
Sumstats: allow users to manage epoch manually
This change allows users to specify an epoch length of 0, which means that the user manually has to finish the epochs. A new next_epoch function is introduced to allow users to manually end epochs. Addresses GH-348
This commit is contained in:
parent
8ffbc69a4d
commit
7362f30c3a
7 changed files with 258 additions and 17 deletions
|
@ -272,6 +272,7 @@ event SumStats::finish_epoch(ss: SumStat)
|
||||||
}
|
}
|
||||||
|
|
||||||
# Schedule the next finish_epoch event.
|
# Schedule the next finish_epoch event.
|
||||||
|
if ( ss$epoch != 0secs )
|
||||||
schedule ss$epoch { SumStats::finish_epoch(ss) };
|
schedule ss$epoch { SumStats::finish_epoch(ss) };
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -93,12 +93,16 @@ export {
|
||||||
## be referred to later.
|
## be referred to later.
|
||||||
name: string;
|
name: string;
|
||||||
|
|
||||||
## The interval at which this filter should be "broken"
|
## The interval at which this sumstat should be "broken"
|
||||||
## and the *epoch_result* callback called. The
|
## and the *epoch_result* callback called. The
|
||||||
## results are also reset at this time so any threshold
|
## results are also reset at this time so any threshold
|
||||||
## based detection needs to be set to a
|
## based detection needs to be set to a
|
||||||
## value that should be expected to happen within
|
## value that should be expected to happen within
|
||||||
## this epoch.
|
## this epoch.
|
||||||
|
##
|
||||||
|
## Passing an epoch of zero (e.g. ``0 secs``) causes this
|
||||||
|
## sumstat to be set to manual epochs. You will have to manually
|
||||||
|
## end the epoch by calling :zeek:see:`SumStats::next_epoch`.
|
||||||
epoch: interval;
|
epoch: interval;
|
||||||
|
|
||||||
## The reducers for the SumStat.
|
## The reducers for the SumStat.
|
||||||
|
@ -175,6 +179,23 @@ export {
|
||||||
##
|
##
|
||||||
## Returns: A string representation of the metric key.
|
## Returns: A string representation of the metric key.
|
||||||
global key2str: function(key: SumStats::Key): string;
|
global key2str: function(key: SumStats::Key): string;
|
||||||
|
|
||||||
|
## Manually end the current epoch for a sumstat. Calling this function will
|
||||||
|
## cause the end of the epoch processing of sumstats to start. Note that the
|
||||||
|
## epoch will not end immidiately - especially in a cluster settings, a number
|
||||||
|
## of messages need to be exchanged between the cluster nodes.
|
||||||
|
##
|
||||||
|
## Note that this function only can be called if the sumstat was created with
|
||||||
|
## an epoch time of zero (manual epochs).
|
||||||
|
##
|
||||||
|
## In a cluster, this function must be called on the manager; it will not have
|
||||||
|
## any effect when called on workers.
|
||||||
|
##
|
||||||
|
## ss_name: SumStat name.
|
||||||
|
##
|
||||||
|
## Returns: true on success, false on failure. Failures can be: sumstat not found,
|
||||||
|
## or sumstat not created for manual epochs.
|
||||||
|
global next_epoch: function(ss_name: string): bool;
|
||||||
}
|
}
|
||||||
|
|
||||||
# The function prototype for plugins to do calculations.
|
# The function prototype for plugins to do calculations.
|
||||||
|
@ -248,6 +269,19 @@ global data_added: function(ss: SumStat, key: Key, result: Result);
|
||||||
# framework for clustered or non-clustered usage.
|
# framework for clustered or non-clustered usage.
|
||||||
global finish_epoch: event(ss: SumStat);
|
global finish_epoch: event(ss: SumStat);
|
||||||
|
|
||||||
|
function next_epoch(ss_name: string): bool
|
||||||
|
{
|
||||||
|
if ( ss_name !in stats_store )
|
||||||
|
return F;
|
||||||
|
|
||||||
|
local ss = stats_store[ss_name];
|
||||||
|
if ( ss$epoch != 0secs )
|
||||||
|
return F;
|
||||||
|
|
||||||
|
event SumStats::finish_epoch(ss);
|
||||||
|
return T;
|
||||||
|
}
|
||||||
|
|
||||||
function key2str(key: Key): string
|
function key2str(key: Key): string
|
||||||
{
|
{
|
||||||
local out = "";
|
local out = "";
|
||||||
|
@ -396,6 +430,9 @@ function create(ss: SumStat)
|
||||||
}
|
}
|
||||||
|
|
||||||
reset(ss);
|
reset(ss);
|
||||||
|
|
||||||
|
## do not schedule epoch if this is set to manual epochs.
|
||||||
|
if ( ss$epoch != 0secs )
|
||||||
schedule ss$epoch { SumStats::finish_epoch(ss) };
|
schedule ss$epoch { SumStats::finish_epoch(ss) };
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -61,6 +61,7 @@ event SumStats::finish_epoch(ss: SumStat)
|
||||||
reset(ss);
|
reset(ss);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if ( ss$epoch != 0secs )
|
||||||
schedule ss$epoch { SumStats::finish_epoch(ss) };
|
schedule ss$epoch { SumStats::finish_epoch(ss) };
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -0,0 +1,11 @@
|
||||||
|
### BTest baseline data generated by btest-diff. Do not edit. Use "btest -U/-u" to update. Requires BTest >= 0.63.
|
||||||
|
### NOTE: This file has been sorted with diff-sort.
|
||||||
|
Host: 1.2.3.4 - num:9 - sum:437.0 - avg:48.6 - max:95.0 - min:3.0 - var:758.8 - std_dev:27.5 - unique:8 - hllunique:8
|
||||||
|
Host: 10.10.10.10 - num:1 - sum:5.0 - avg:5.0 - max:5.0 - min:5.0 - var:0.0 - std_dev:0.0 - unique:1 - hllunique:1
|
||||||
|
Host: 6.5.4.3 - num:2 - sum:6.0 - avg:3.0 - max:5.0 - min:1.0 - var:8.0 - std_dev:2.8 - unique:2 - hllunique:2
|
||||||
|
Host: 7.2.1.5 - num:2 - sum:145.0 - avg:72.5 - max:91.0 - min:54.0 - var:684.5 - std_dev:26.2 - unique:2 - hllunique:2
|
||||||
|
Performing first epoch, no observations
|
||||||
|
Performing second epoch with overvations
|
||||||
|
Sending ready for data
|
||||||
|
epoch finished, F
|
||||||
|
epoch finished, T
|
|
@ -0,0 +1,8 @@
|
||||||
|
### BTest baseline data generated by btest-diff. Do not edit. Use "btest -U/-u" to update. Requires BTest >= 0.63.
|
||||||
|
Performing first epoch, no observations
|
||||||
|
epoch_finished
|
||||||
|
Performing second epoch with overvations
|
||||||
|
Host: 1.2.3.4 - num:5 - sum:221.0 - var:1144.2 - avg:44.2 - max:94.0 - min:5.0 - std_dev:33.8 - unique:4 - hllunique:4
|
||||||
|
Host: 6.5.4.3 - num:1 - sum:2.0 - var:0.0 - avg:2.0 - max:2.0 - min:2.0 - std_dev:0.0 - unique:1 - hllunique:1
|
||||||
|
Host: 7.2.1.5 - num:1 - sum:1.0 - var:0.0 - avg:1.0 - max:1.0 - min:1.0 - std_dev:0.0 - unique:1 - hllunique:1
|
||||||
|
epoch_finished
|
|
@ -0,0 +1,123 @@
|
||||||
|
# @TEST-PORT: BROKER_PORT1
|
||||||
|
# @TEST-PORT: BROKER_PORT2
|
||||||
|
# @TEST-PORT: BROKER_PORT3
|
||||||
|
#
|
||||||
|
# @TEST-EXEC: btest-bg-run manager-1 ZEEKPATH=$ZEEKPATH:.. CLUSTER_NODE=manager-1 zeek -b %INPUT
|
||||||
|
# @TEST-EXEC: btest-bg-run worker-1 ZEEKPATH=$ZEEKPATH:.. CLUSTER_NODE=worker-1 zeek -b %INPUT
|
||||||
|
# @TEST-EXEC: btest-bg-run worker-2 ZEEKPATH=$ZEEKPATH:.. CLUSTER_NODE=worker-2 zeek -b %INPUT
|
||||||
|
# @TEST-EXEC: btest-bg-wait 30
|
||||||
|
|
||||||
|
# @TEST-EXEC: TEST_DIFF_CANONIFIER=$SCRIPTS/diff-sort btest-diff manager-1/.stdout
|
||||||
|
|
||||||
|
@load base/frameworks/sumstats
|
||||||
|
@load base/frameworks/cluster
|
||||||
|
|
||||||
|
@TEST-START-FILE cluster-layout.zeek
|
||||||
|
redef Cluster::nodes = {
|
||||||
|
["manager-1"] = [$node_type=Cluster::MANAGER, $ip=127.0.0.1, $p=to_port(getenv("BROKER_PORT1"))],
|
||||||
|
["worker-1"] = [$node_type=Cluster::WORKER, $ip=127.0.0.1, $p=to_port(getenv("BROKER_PORT2")), $manager="manager-1", $interface="eth0"],
|
||||||
|
["worker-2"] = [$node_type=Cluster::WORKER, $ip=127.0.0.1, $p=to_port(getenv("BROKER_PORT3")), $manager="manager-1", $interface="eth1"],
|
||||||
|
};
|
||||||
|
@TEST-END-FILE
|
||||||
|
|
||||||
|
redef Log::default_rotation_interval = 0secs;
|
||||||
|
|
||||||
|
global n = 0;
|
||||||
|
global did_data = F;
|
||||||
|
|
||||||
|
event zeek_init() &priority=5
|
||||||
|
{
|
||||||
|
local r1: SumStats::Reducer = [$stream="test", $apply=set(SumStats::SUM, SumStats::MIN, SumStats::MAX, SumStats::AVERAGE, SumStats::STD_DEV, SumStats::VARIANCE, SumStats::UNIQUE, SumStats::HLL_UNIQUE)];
|
||||||
|
SumStats::create([$name="test",
|
||||||
|
$epoch=0secs,
|
||||||
|
$reducers=set(r1),
|
||||||
|
$epoch_result(ts: time, key: SumStats::Key, result: SumStats::Result) =
|
||||||
|
{
|
||||||
|
if ( ! did_data ) return;
|
||||||
|
local r = result["test"];
|
||||||
|
print fmt("Host: %s - num:%d - sum:%.1f - avg:%.1f - max:%.1f - min:%.1f - var:%.1f - std_dev:%.1f - unique:%d - hllunique:%d", key$host, r$num, r$sum, r$average, r$max, r$min, r$variance, r$std_dev, r$unique, r$hll_unique);
|
||||||
|
},
|
||||||
|
$epoch_finished(ts: time) =
|
||||||
|
{
|
||||||
|
print "epoch finished", did_data;
|
||||||
|
if ( did_data )
|
||||||
|
terminate();
|
||||||
|
}]);
|
||||||
|
}
|
||||||
|
|
||||||
|
event Broker::peer_lost(endpoint: Broker::EndpointInfo, msg: string)
|
||||||
|
{
|
||||||
|
terminate();
|
||||||
|
}
|
||||||
|
|
||||||
|
global ready_for_data: event();
|
||||||
|
|
||||||
|
event ready_for_data()
|
||||||
|
{
|
||||||
|
if ( Cluster::node == "worker-1" )
|
||||||
|
{
|
||||||
|
SumStats::observe("test", [$host=1.2.3.4], [$num=34]);
|
||||||
|
SumStats::observe("test", [$host=1.2.3.4], [$num=30]);
|
||||||
|
SumStats::observe("test", [$host=6.5.4.3], [$num=1]);
|
||||||
|
SumStats::observe("test", [$host=7.2.1.5], [$num=54]);
|
||||||
|
}
|
||||||
|
if ( Cluster::node == "worker-2" )
|
||||||
|
{
|
||||||
|
SumStats::observe("test", [$host=1.2.3.4], [$num=75]);
|
||||||
|
SumStats::observe("test", [$host=1.2.3.4], [$num=30]);
|
||||||
|
SumStats::observe("test", [$host=1.2.3.4], [$num=3]);
|
||||||
|
SumStats::observe("test", [$host=1.2.3.4], [$num=57]);
|
||||||
|
SumStats::observe("test", [$host=1.2.3.4], [$num=52]);
|
||||||
|
SumStats::observe("test", [$host=1.2.3.4], [$num=61]);
|
||||||
|
SumStats::observe("test", [$host=1.2.3.4], [$num=95]);
|
||||||
|
SumStats::observe("test", [$host=6.5.4.3], [$num=5]);
|
||||||
|
SumStats::observe("test", [$host=7.2.1.5], [$num=91]);
|
||||||
|
SumStats::observe("test", [$host=10.10.10.10], [$num=5]);
|
||||||
|
}
|
||||||
|
|
||||||
|
did_data = T;
|
||||||
|
}
|
||||||
|
|
||||||
|
@if ( Cluster::local_node_type() == Cluster::MANAGER )
|
||||||
|
|
||||||
|
event second_test()
|
||||||
|
{
|
||||||
|
print "Performing second epoch with overvations";
|
||||||
|
local ret = SumStats::next_epoch("test");
|
||||||
|
if ( ! ret )
|
||||||
|
print "Return value false";
|
||||||
|
}
|
||||||
|
|
||||||
|
event send_ready_for_data()
|
||||||
|
{
|
||||||
|
print "Sending ready for data";
|
||||||
|
event ready_for_data();
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
event cont_test()
|
||||||
|
{
|
||||||
|
print "Performing first epoch, no observations";
|
||||||
|
local ret = SumStats::next_epoch("test");
|
||||||
|
if ( ! ret )
|
||||||
|
print "Return value false";
|
||||||
|
schedule 5secs { send_ready_for_data() };
|
||||||
|
schedule 10secs { second_test() };
|
||||||
|
}
|
||||||
|
|
||||||
|
event zeek_init() &priority=100
|
||||||
|
{
|
||||||
|
Broker::auto_publish(Cluster::worker_topic, ready_for_data);
|
||||||
|
}
|
||||||
|
|
||||||
|
global peer_count = 0;
|
||||||
|
|
||||||
|
event Broker::peer_added(endpoint: Broker::EndpointInfo, msg: string)
|
||||||
|
{
|
||||||
|
++peer_count;
|
||||||
|
|
||||||
|
if ( peer_count == 2 )
|
||||||
|
event cont_test();
|
||||||
|
}
|
||||||
|
|
||||||
|
@endif
|
|
@ -0,0 +1,60 @@
|
||||||
|
# @TEST-EXEC: btest-bg-run standalone zeek -b %INPUT
|
||||||
|
# @TEST-EXEC: btest-bg-wait 15
|
||||||
|
# @TEST-EXEC: btest-diff standalone/.stdout
|
||||||
|
|
||||||
|
@load base/frameworks/sumstats
|
||||||
|
|
||||||
|
redef exit_only_after_terminate=T;
|
||||||
|
|
||||||
|
event second_test()
|
||||||
|
{
|
||||||
|
SumStats::observe("test.metric", [$host=1.2.3.4], [$num=5]);
|
||||||
|
SumStats::observe("test.metric", [$host=1.2.3.4], [$num=22]);
|
||||||
|
SumStats::observe("test.metric", [$host=1.2.3.4], [$num=94]);
|
||||||
|
SumStats::observe("test.metric", [$host=1.2.3.4], [$num=50]);
|
||||||
|
SumStats::observe("test.metric", [$host=1.2.3.4], [$num=50]);
|
||||||
|
|
||||||
|
SumStats::observe("test.metric", [$host=6.5.4.3], [$num=2]);
|
||||||
|
SumStats::observe("test.metric", [$host=7.2.1.5], [$num=1]);
|
||||||
|
print "Performing second epoch with overvations";
|
||||||
|
local ret = SumStats::next_epoch("test");
|
||||||
|
if ( ! ret )
|
||||||
|
print "Return value false";
|
||||||
|
}
|
||||||
|
|
||||||
|
event cont_test()
|
||||||
|
{
|
||||||
|
print "Performing first epoch, no observations";
|
||||||
|
local ret = SumStats::next_epoch("test");
|
||||||
|
if ( ! ret )
|
||||||
|
print "Return value false";
|
||||||
|
schedule 2secs { second_test() };
|
||||||
|
}
|
||||||
|
|
||||||
|
event zeek_init() &priority=5
|
||||||
|
{
|
||||||
|
local r1: SumStats::Reducer = [$stream="test.metric",
|
||||||
|
$apply=set(SumStats::SUM,
|
||||||
|
SumStats::VARIANCE,
|
||||||
|
SumStats::AVERAGE,
|
||||||
|
SumStats::MAX,
|
||||||
|
SumStats::MIN,
|
||||||
|
SumStats::STD_DEV,
|
||||||
|
SumStats::UNIQUE,
|
||||||
|
SumStats::HLL_UNIQUE)];
|
||||||
|
SumStats::create([$name="test",
|
||||||
|
$epoch=0secs,
|
||||||
|
$reducers=set(r1),
|
||||||
|
$epoch_result(ts: time, key: SumStats::Key, result: SumStats::Result) =
|
||||||
|
{
|
||||||
|
local r = result["test.metric"];
|
||||||
|
print fmt("Host: %s - num:%d - sum:%.1f - var:%.1f - avg:%.1f - max:%.1f - min:%.1f - std_dev:%.1f - unique:%d - hllunique:%d", key$host, r$num, r$sum, r$variance, r$average, r$max, r$min, r$std_dev, r$unique, r$hll_unique);
|
||||||
|
terminate();
|
||||||
|
},
|
||||||
|
$epoch_finished(ts: time) =
|
||||||
|
{
|
||||||
|
print "epoch_finished";
|
||||||
|
}]);
|
||||||
|
|
||||||
|
schedule 1secs { cont_test() };
|
||||||
|
}
|
Loading…
Add table
Add a link
Reference in a new issue