2005-04-16 22:20:36 +00:00
|
|
|
/*
|
|
|
|
* ip_vs_est.c: simple rate estimator for IPVS
|
|
|
|
*
|
|
|
|
* Authors: Wensong Zhang <wensong@linuxvirtualserver.org>
|
|
|
|
*
|
|
|
|
* This program is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU General Public License
|
|
|
|
* as published by the Free Software Foundation; either version
|
|
|
|
* 2 of the License, or (at your option) any later version.
|
|
|
|
*
|
2011-01-03 13:44:54 +00:00
|
|
|
* Changes: Hans Schillstrom <hans.schillstrom@ericsson.com>
|
|
|
|
* Network name space (netns) aware.
|
|
|
|
* Global data moved to netns i.e struct netns_ipvs
|
|
|
|
* Affected data: est_list and est_lock.
|
|
|
|
* estimation_timer() runs with timer per netns.
|
|
|
|
* get_stats()) do the per cpu summing.
|
2005-04-16 22:20:36 +00:00
|
|
|
*/
|
2009-07-30 21:29:44 +00:00
|
|
|
|
|
|
|
#define KMSG_COMPONENT "IPVS"
|
|
|
|
#define pr_fmt(fmt) KMSG_COMPONENT ": " fmt
|
|
|
|
|
2005-04-16 22:20:36 +00:00
|
|
|
#include <linux/kernel.h>
|
2005-12-27 04:43:12 +00:00
|
|
|
#include <linux/jiffies.h>
|
2005-04-16 22:20:36 +00:00
|
|
|
#include <linux/types.h>
|
2006-01-05 20:14:43 +00:00
|
|
|
#include <linux/interrupt.h>
|
2008-01-12 10:33:50 +00:00
|
|
|
#include <linux/sysctl.h>
|
2008-08-10 18:24:41 +00:00
|
|
|
#include <linux/list.h>
|
2005-04-16 22:20:36 +00:00
|
|
|
|
|
|
|
#include <net/ip_vs.h>
|
|
|
|
|
|
|
|
/*
|
|
|
|
This code is to estimate rate in a shorter interval (such as 8
|
|
|
|
seconds) for virtual services and real servers. For measure rate in a
|
|
|
|
long interval, it is easy to implement a user level daemon which
|
|
|
|
periodically reads those statistical counters and measure rate.
|
|
|
|
|
|
|
|
Currently, the measurement is activated by slow timer handler. Hope
|
|
|
|
this measurement will not introduce too much load.
|
|
|
|
|
|
|
|
We measure rate during the last 8 seconds every 2 seconds:
|
|
|
|
|
|
|
|
avgrate = avgrate*(1-W) + rate*W
|
|
|
|
|
|
|
|
where W = 2^(-2)
|
|
|
|
|
|
|
|
NOTES.
|
|
|
|
|
|
|
|
* The stored value for average bps is scaled by 2^5, so that maximal
|
|
|
|
rate is ~2.15Gbits/s, average pps and cps are scaled by 2^10.
|
|
|
|
|
|
|
|
* A lot code is taken from net/sched/estimator.c
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
2011-01-03 13:44:56 +00:00
|
|
|
/*
|
|
|
|
* Make a summary from each cpu
|
|
|
|
*/
|
|
|
|
static void ip_vs_read_cpu_stats(struct ip_vs_stats_user *sum,
|
|
|
|
struct ip_vs_cpu_stats *stats)
|
|
|
|
{
|
|
|
|
int i;
|
|
|
|
|
|
|
|
for_each_possible_cpu(i) {
|
|
|
|
struct ip_vs_cpu_stats *s = per_cpu_ptr(stats, i);
|
|
|
|
unsigned int start;
|
|
|
|
__u64 inbytes, outbytes;
|
|
|
|
if (i) {
|
|
|
|
sum->conns += s->ustats.conns;
|
|
|
|
sum->inpkts += s->ustats.inpkts;
|
|
|
|
sum->outpkts += s->ustats.outpkts;
|
|
|
|
do {
|
|
|
|
start = u64_stats_fetch_begin_bh(&s->syncp);
|
|
|
|
inbytes = s->ustats.inbytes;
|
|
|
|
outbytes = s->ustats.outbytes;
|
|
|
|
} while (u64_stats_fetch_retry_bh(&s->syncp, start));
|
|
|
|
sum->inbytes += inbytes;
|
|
|
|
sum->outbytes += outbytes;
|
|
|
|
} else {
|
|
|
|
sum->conns = s->ustats.conns;
|
|
|
|
sum->inpkts = s->ustats.inpkts;
|
|
|
|
sum->outpkts = s->ustats.outpkts;
|
|
|
|
do {
|
|
|
|
start = u64_stats_fetch_begin_bh(&s->syncp);
|
|
|
|
sum->inbytes = s->ustats.inbytes;
|
|
|
|
sum->outbytes = s->ustats.outbytes;
|
|
|
|
} while (u64_stats_fetch_retry_bh(&s->syncp, start));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2005-04-16 22:20:36 +00:00
|
|
|
static void estimation_timer(unsigned long arg)
|
|
|
|
{
|
|
|
|
struct ip_vs_estimator *e;
|
|
|
|
struct ip_vs_stats *s;
|
|
|
|
u32 n_conns;
|
|
|
|
u32 n_inpkts, n_outpkts;
|
|
|
|
u64 n_inbytes, n_outbytes;
|
|
|
|
u32 rate;
|
2011-01-03 13:44:54 +00:00
|
|
|
struct net *net = (struct net *)arg;
|
|
|
|
struct netns_ipvs *ipvs;
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2011-01-03 13:44:54 +00:00
|
|
|
ipvs = net_ipvs(net);
|
2011-01-03 13:44:56 +00:00
|
|
|
ip_vs_read_cpu_stats(&ipvs->tot_stats->ustats, ipvs->cpustats);
|
2011-01-03 13:44:54 +00:00
|
|
|
spin_lock(&ipvs->est_lock);
|
|
|
|
list_for_each_entry(e, &ipvs->est_list, list) {
|
2008-08-10 18:24:41 +00:00
|
|
|
s = container_of(e, struct ip_vs_stats, est);
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2011-01-03 13:44:56 +00:00
|
|
|
ip_vs_read_cpu_stats(&s->ustats, s->cpustats);
|
2005-04-16 22:20:36 +00:00
|
|
|
spin_lock(&s->lock);
|
2008-09-08 11:39:04 +00:00
|
|
|
n_conns = s->ustats.conns;
|
|
|
|
n_inpkts = s->ustats.inpkts;
|
|
|
|
n_outpkts = s->ustats.outpkts;
|
|
|
|
n_inbytes = s->ustats.inbytes;
|
|
|
|
n_outbytes = s->ustats.outbytes;
|
2005-04-16 22:20:36 +00:00
|
|
|
|
|
|
|
/* scaled by 2^10, but divided 2 seconds */
|
2011-01-03 13:44:54 +00:00
|
|
|
rate = (n_conns - e->last_conns) << 9;
|
2005-04-16 22:20:36 +00:00
|
|
|
e->last_conns = n_conns;
|
2011-01-03 13:44:54 +00:00
|
|
|
e->cps += ((long)rate - (long)e->cps) >> 2;
|
|
|
|
s->ustats.cps = (e->cps + 0x1FF) >> 10;
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2011-01-03 13:44:54 +00:00
|
|
|
rate = (n_inpkts - e->last_inpkts) << 9;
|
2005-04-16 22:20:36 +00:00
|
|
|
e->last_inpkts = n_inpkts;
|
2011-01-03 13:44:54 +00:00
|
|
|
e->inpps += ((long)rate - (long)e->inpps) >> 2;
|
|
|
|
s->ustats.inpps = (e->inpps + 0x1FF) >> 10;
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2011-01-03 13:44:54 +00:00
|
|
|
rate = (n_outpkts - e->last_outpkts) << 9;
|
2005-04-16 22:20:36 +00:00
|
|
|
e->last_outpkts = n_outpkts;
|
2011-01-03 13:44:54 +00:00
|
|
|
e->outpps += ((long)rate - (long)e->outpps) >> 2;
|
|
|
|
s->ustats.outpps = (e->outpps + 0x1FF) >> 10;
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2011-01-03 13:44:54 +00:00
|
|
|
rate = (n_inbytes - e->last_inbytes) << 4;
|
2005-04-16 22:20:36 +00:00
|
|
|
e->last_inbytes = n_inbytes;
|
2011-01-03 13:44:54 +00:00
|
|
|
e->inbps += ((long)rate - (long)e->inbps) >> 2;
|
|
|
|
s->ustats.inbps = (e->inbps + 0xF) >> 5;
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2011-01-03 13:44:54 +00:00
|
|
|
rate = (n_outbytes - e->last_outbytes) << 4;
|
2005-04-16 22:20:36 +00:00
|
|
|
e->last_outbytes = n_outbytes;
|
2011-01-03 13:44:54 +00:00
|
|
|
e->outbps += ((long)rate - (long)e->outbps) >> 2;
|
|
|
|
s->ustats.outbps = (e->outbps + 0xF) >> 5;
|
2005-04-16 22:20:36 +00:00
|
|
|
spin_unlock(&s->lock);
|
|
|
|
}
|
2011-01-03 13:44:54 +00:00
|
|
|
spin_unlock(&ipvs->est_lock);
|
|
|
|
mod_timer(&ipvs->est_timer, jiffies + 2*HZ);
|
2005-04-16 22:20:36 +00:00
|
|
|
}
|
|
|
|
|
2011-01-03 13:44:54 +00:00
|
|
|
void ip_vs_new_estimator(struct net *net, struct ip_vs_stats *stats)
|
2005-04-16 22:20:36 +00:00
|
|
|
{
|
2011-01-03 13:44:54 +00:00
|
|
|
struct netns_ipvs *ipvs = net_ipvs(net);
|
2008-08-10 18:24:41 +00:00
|
|
|
struct ip_vs_estimator *est = &stats->est;
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2008-08-10 18:24:41 +00:00
|
|
|
INIT_LIST_HEAD(&est->list);
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2008-09-08 11:39:04 +00:00
|
|
|
est->last_conns = stats->ustats.conns;
|
|
|
|
est->cps = stats->ustats.cps<<10;
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2008-09-08 11:39:04 +00:00
|
|
|
est->last_inpkts = stats->ustats.inpkts;
|
|
|
|
est->inpps = stats->ustats.inpps<<10;
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2008-09-08 11:39:04 +00:00
|
|
|
est->last_outpkts = stats->ustats.outpkts;
|
|
|
|
est->outpps = stats->ustats.outpps<<10;
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2008-09-08 11:39:04 +00:00
|
|
|
est->last_inbytes = stats->ustats.inbytes;
|
|
|
|
est->inbps = stats->ustats.inbps<<5;
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2008-09-08 11:39:04 +00:00
|
|
|
est->last_outbytes = stats->ustats.outbytes;
|
|
|
|
est->outbps = stats->ustats.outbps<<5;
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2011-01-03 13:44:54 +00:00
|
|
|
spin_lock_bh(&ipvs->est_lock);
|
|
|
|
list_add(&est->list, &ipvs->est_list);
|
|
|
|
spin_unlock_bh(&ipvs->est_lock);
|
2005-04-16 22:20:36 +00:00
|
|
|
}
|
|
|
|
|
2011-01-03 13:44:54 +00:00
|
|
|
void ip_vs_kill_estimator(struct net *net, struct ip_vs_stats *stats)
|
2005-04-16 22:20:36 +00:00
|
|
|
{
|
2011-01-03 13:44:54 +00:00
|
|
|
struct netns_ipvs *ipvs = net_ipvs(net);
|
2008-08-10 18:24:41 +00:00
|
|
|
struct ip_vs_estimator *est = &stats->est;
|
|
|
|
|
2011-01-03 13:44:54 +00:00
|
|
|
spin_lock_bh(&ipvs->est_lock);
|
2008-08-10 18:24:41 +00:00
|
|
|
list_del(&est->list);
|
2011-01-03 13:44:54 +00:00
|
|
|
spin_unlock_bh(&ipvs->est_lock);
|
2005-04-16 22:20:36 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void ip_vs_zero_estimator(struct ip_vs_stats *stats)
|
|
|
|
{
|
2008-08-10 18:24:41 +00:00
|
|
|
struct ip_vs_estimator *est = &stats->est;
|
|
|
|
|
|
|
|
/* set counters zero, caller must hold the stats->lock lock */
|
|
|
|
est->last_inbytes = 0;
|
|
|
|
est->last_outbytes = 0;
|
|
|
|
est->last_conns = 0;
|
|
|
|
est->last_inpkts = 0;
|
|
|
|
est->last_outpkts = 0;
|
|
|
|
est->cps = 0;
|
|
|
|
est->inpps = 0;
|
|
|
|
est->outpps = 0;
|
|
|
|
est->inbps = 0;
|
|
|
|
est->outbps = 0;
|
2005-04-16 22:20:36 +00:00
|
|
|
}
|
2008-08-13 22:47:16 +00:00
|
|
|
|
2011-01-03 13:44:42 +00:00
|
|
|
static int __net_init __ip_vs_estimator_init(struct net *net)
|
|
|
|
{
|
2011-01-03 13:44:54 +00:00
|
|
|
struct netns_ipvs *ipvs = net_ipvs(net);
|
|
|
|
|
|
|
|
INIT_LIST_HEAD(&ipvs->est_list);
|
|
|
|
spin_lock_init(&ipvs->est_lock);
|
|
|
|
setup_timer(&ipvs->est_timer, estimation_timer, (unsigned long)net);
|
|
|
|
mod_timer(&ipvs->est_timer, jiffies + 2 * HZ);
|
2011-01-03 13:44:42 +00:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2011-01-03 13:44:54 +00:00
|
|
|
static void __net_exit __ip_vs_estimator_exit(struct net *net)
|
|
|
|
{
|
|
|
|
del_timer_sync(&net_ipvs(net)->est_timer);
|
|
|
|
}
|
2011-01-03 13:44:42 +00:00
|
|
|
static struct pernet_operations ip_vs_app_ops = {
|
|
|
|
.init = __ip_vs_estimator_init,
|
2011-01-03 13:44:54 +00:00
|
|
|
.exit = __ip_vs_estimator_exit,
|
2011-01-03 13:44:42 +00:00
|
|
|
};
|
|
|
|
|
2008-08-13 22:47:16 +00:00
|
|
|
int __init ip_vs_estimator_init(void)
|
|
|
|
{
|
2011-01-03 13:44:42 +00:00
|
|
|
int rv;
|
|
|
|
|
|
|
|
rv = register_pernet_subsys(&ip_vs_app_ops);
|
|
|
|
return rv;
|
2008-08-13 22:47:16 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void ip_vs_estimator_cleanup(void)
|
|
|
|
{
|
2011-01-03 13:44:42 +00:00
|
|
|
unregister_pernet_subsys(&ip_vs_app_ops);
|
2008-08-13 22:47:16 +00:00
|
|
|
}
|