dummynet.c revision 204591
1187769Sluigi/*
2204591Sluigi * Copyright (c) 2002-2003,2010 Luigi Rizzo
3187769Sluigi *
4187769Sluigi * Redistribution and use in source forms, with and without modification,
5187769Sluigi * are permitted provided that this entire comment appears intact.
6187769Sluigi *
7187769Sluigi * Redistribution in binary form may occur without any restrictions.
8187769Sluigi * Obviously, it would be nice if you gave credit where credit is due
9187769Sluigi * but requiring it would be too onerous.
10187769Sluigi *
11187769Sluigi * This software is provided ``AS IS'' without any warranties of any kind.
12187769Sluigi *
13187769Sluigi * NEW command line interface for IP firewall facility
14187769Sluigi *
15187769Sluigi * $FreeBSD: head/sbin/ipfw/dummynet.c 204591 2010-03-02 17:40:48Z luigi $
16187769Sluigi *
17187769Sluigi * dummynet support
18187769Sluigi */
19187769Sluigi
#include <sys/types.h>
#include <sys/socket.h>
/* XXX there are several sysctl leftover here */
#include <sys/sysctl.h>

#include "ipfw2.h"

#include <ctype.h>
#include <err.h>
#include <errno.h>
#include <libutil.h>
#include <limits.h>
#include <netdb.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <sysexits.h>

#include <net/if.h>
#include <netinet/in.h>
#include <netinet/ip_fw.h>
#include <netinet/ip_dummynet.h>
#include <arpa/inet.h>	/* inet_ntoa */
42187769Sluigi
43204591Sluigi
44187769Sluigistatic struct _s_x dummynet_params[] = {
45187769Sluigi	{ "plr",		TOK_PLR },
46187769Sluigi	{ "noerror",		TOK_NOERROR },
47187769Sluigi	{ "buckets",		TOK_BUCKETS },
48187769Sluigi	{ "dst-ip",		TOK_DSTIP },
49187769Sluigi	{ "src-ip",		TOK_SRCIP },
50187769Sluigi	{ "dst-port",		TOK_DSTPORT },
51187769Sluigi	{ "src-port",		TOK_SRCPORT },
52187769Sluigi	{ "proto",		TOK_PROTO },
53187769Sluigi	{ "weight",		TOK_WEIGHT },
54204591Sluigi	{ "lmax",		TOK_LMAX },
55204591Sluigi	{ "maxlen",		TOK_LMAX },
56187769Sluigi	{ "all",		TOK_ALL },
57204591Sluigi	{ "mask",		TOK_MASK }, /* alias for both */
58204591Sluigi	{ "sched_mask",		TOK_SCHED_MASK },
59204591Sluigi	{ "flow_mask",		TOK_FLOW_MASK },
60187769Sluigi	{ "droptail",		TOK_DROPTAIL },
61187769Sluigi	{ "red",		TOK_RED },
62187769Sluigi	{ "gred",		TOK_GRED },
63187769Sluigi	{ "bw",			TOK_BW },
64187769Sluigi	{ "bandwidth",		TOK_BW },
65187769Sluigi	{ "delay",		TOK_DELAY },
66204591Sluigi	{ "link",		TOK_LINK },
67187769Sluigi	{ "pipe",		TOK_PIPE },
68187769Sluigi	{ "queue",		TOK_QUEUE },
69204591Sluigi	{ "flowset",		TOK_FLOWSET },
70204591Sluigi	{ "sched",		TOK_SCHED },
71204591Sluigi	{ "pri",		TOK_PRI },
72204591Sluigi	{ "priority",		TOK_PRI },
73204591Sluigi	{ "type",		TOK_TYPE },
74187769Sluigi	{ "flow-id",		TOK_FLOWID},
75187769Sluigi	{ "dst-ipv6",		TOK_DSTIP6},
76187769Sluigi	{ "dst-ip6",		TOK_DSTIP6},
77187769Sluigi	{ "src-ipv6",		TOK_SRCIP6},
78187769Sluigi	{ "src-ip6",		TOK_SRCIP6},
79204591Sluigi	{ "profile",		TOK_PROFILE},
80194930Soleg	{ "burst",		TOK_BURST},
81187769Sluigi	{ "dummynet-params",	TOK_NULL },
82187769Sluigi	{ NULL, 0 }	/* terminator */
83187769Sluigi};
84187769Sluigi
/*
 * Address `len` bytes past `p`, as an untyped pointer.
 * Both arguments are parenthesized so that expression arguments such as
 * O_NEXT(ptr + 1, a + b) are offset from the intended address.
 */
#define O_NEXT(p, len) ((void *)((char *)(p) + (len)))
86204591Sluigi
87204591Sluigistatic void
88204591Sluigioid_fill(struct dn_id *oid, int len, int type, uintptr_t id)
89204591Sluigi{
90204591Sluigi	oid->len = len;
91204591Sluigi	oid->type = type;
92204591Sluigi	oid->subtype = 0;
93204591Sluigi	oid->id = id;
94204591Sluigi}
95204591Sluigi
/*
 * Claim `len` bytes at *o for a new object: advance *o past the object,
 * fill in the object's header (given type, id 0) and return a pointer
 * to the start of the object.
 */
static void *
o_next(struct dn_id **o, int len, int type)
{
	struct dn_id *hdr = *o;

	*o = O_NEXT(hdr, len);
	oid_fill(hdr, len, type, 0);
	return hdr;
}
105204591Sluigi
#if 0
/*
 * Comparator for flow queues (currently compiled out).
 * The absolute value of co.do_sort selects the field compared
 * (1 pkts, 2 bytes, 3 total pkts, 4 total bytes); a negative value
 * reverses the sign of the result.
 */
static int
sort_q(void *arg, const void *pa, const void *pb)
{
	const struct dn_flow_queue *qa = pa;
	const struct dn_flow_queue *qb = pb;
	int reversed = (co.do_sort < 0);
	int key = reversed ? -co.do_sort : co.do_sort;
	long long diff = 0;

	switch (key) {
	case 1: /* pkts */
		diff = qa->len - qb->len;
		break;
	case 2: /* bytes */
		diff = qa->len_bytes - qb->len_bytes;
		break;
	case 3: /* tot pkts */
		diff = qa->tot_pkts - qb->tot_pkts;
		break;
	case 4: /* tot bytes */
		diff = qa->tot_bytes - qb->tot_bytes;
		break;
	}

	/* clamp to -1 / 0 / 1 */
	if (diff < 0)
		diff = -1;
	else if (diff > 0)
		diff = 1;
	return (int)(reversed ? diff : -diff);
}
#endif
139187769Sluigi
140204591Sluigi/* print a mask and header for the subsequent list of flows */
141187769Sluigistatic void
142204591Sluigiprint_mask(struct ipfw_flow_id *id)
143187769Sluigi{
144204591Sluigi	if (!IS_IP6_FLOW_ID(id)) {
145204591Sluigi		printf("    "
146204591Sluigi		    "mask: 0x%02x 0x%08x/0x%04x -> 0x%08x/0x%04x\n",
147204591Sluigi		    id->proto,
148204591Sluigi		    id->src_ip, id->src_port,
149204591Sluigi		    id->dst_ip, id->dst_port);
150187769Sluigi
151204591Sluigi		printf("BKT Prot ___Source IP/port____ "
152204591Sluigi		    "____Dest. IP/port____ "
153204591Sluigi		    "Tot_pkt/bytes Pkt/Byte Drp\n");
154204591Sluigi	} else {
155204591Sluigi		char buf[255];
156204591Sluigi		printf("\n        mask: proto: 0x%02x, flow_id: 0x%08x,  ",
157204591Sluigi		    id->proto, id->flow_id6);
158204591Sluigi		inet_ntop(AF_INET6, &(id->src_ip6), buf, sizeof(buf));
159204591Sluigi		printf("%s/0x%04x -> ", buf, id->src_port);
160204591Sluigi		inet_ntop(AF_INET6, &(id->dst_ip6), buf, sizeof(buf));
161204591Sluigi		printf("%s/0x%04x\n", buf, id->dst_port);
162187769Sluigi
163204591Sluigi		printf("BKT ___Prot___ _flow-id_ "
164204591Sluigi		    "______________Source IPv6/port_______________ "
165204591Sluigi		    "_______________Dest. IPv6/port_______________ "
166204591Sluigi		    "Tot_pkt/bytes Pkt/Byte Drp\n");
167204591Sluigi	}
168204591Sluigi}
169187769Sluigi
170204591Sluigistatic void
171204591Sluigilist_flow(struct dn_flow *ni)
172204591Sluigi{
173204591Sluigi	char buff[255];
174204591Sluigi	struct protoent *pe;
175204591Sluigi	struct in_addr ina;
176204591Sluigi	struct ipfw_flow_id *id = &ni->fid;
177187769Sluigi
178204591Sluigi	pe = getprotobynumber(id->proto);
179187769Sluigi		/* XXX: Should check for IPv4 flows */
180204591Sluigi	printf("%3u ", (ni->oid.id) & 0xff);
181204591Sluigi	if (!IS_IP6_FLOW_ID(id)) {
182187769Sluigi		if (pe)
183187769Sluigi			printf("%-4s ", pe->p_name);
184187769Sluigi		else
185204591Sluigi			printf("%4u ", id->proto);
186204591Sluigi		ina.s_addr = htonl(id->src_ip);
187187769Sluigi		printf("%15s/%-5d ",
188204591Sluigi		    inet_ntoa(ina), id->src_port);
189204591Sluigi		ina.s_addr = htonl(id->dst_ip);
190187769Sluigi		printf("%15s/%-5d ",
191204591Sluigi		    inet_ntoa(ina), id->dst_port);
192204591Sluigi	} else {
193204591Sluigi		/* Print IPv6 flows */
194187769Sluigi		if (pe != NULL)
195187769Sluigi			printf("%9s ", pe->p_name);
196187769Sluigi		else
197204591Sluigi			printf("%9u ", id->proto);
198204591Sluigi		printf("%7d  %39s/%-5d ", id->flow_id6,
199204591Sluigi		    inet_ntop(AF_INET6, &(id->src_ip6), buff, sizeof(buff)),
200204591Sluigi		    id->src_port);
201187769Sluigi		printf(" %39s/%-5d ",
202204591Sluigi		    inet_ntop(AF_INET6, &(id->dst_ip6), buff, sizeof(buff)),
203204591Sluigi		    id->dst_port);
204187769Sluigi	}
205204591Sluigi	printf("%4llu %8llu %2u %4u %3u\n",
206204591Sluigi	    align_uint64(&ni->tot_pkts),
207204591Sluigi	    align_uint64(&ni->tot_bytes),
208204591Sluigi	    ni->length, ni->len_bytes, ni->drops);
209187769Sluigi}
210187769Sluigi
211187769Sluigistatic void
212204591Sluigiprint_flowset_parms(struct dn_fs *fs, char *prefix)
213187769Sluigi{
214187769Sluigi	int l;
215187769Sluigi	char qs[30];
216187769Sluigi	char plr[30];
217187769Sluigi	char red[90];	/* Display RED parameters */
218187769Sluigi
219187769Sluigi	l = fs->qsize;
220204591Sluigi	if (fs->flags & DN_QSIZE_BYTES) {
221187769Sluigi		if (l >= 8192)
222187769Sluigi			sprintf(qs, "%d KB", l / 1024);
223187769Sluigi		else
224187769Sluigi			sprintf(qs, "%d B", l);
225187769Sluigi	} else
226187769Sluigi		sprintf(qs, "%3d sl.", l);
227187769Sluigi	if (fs->plr)
228187769Sluigi		sprintf(plr, "plr %f", 1.0 * fs->plr / (double)(0x7fffffff));
229187769Sluigi	else
230187769Sluigi		plr[0] = '\0';
231204591Sluigi
232204591Sluigi	if (fs->flags & DN_IS_RED)	/* RED parameters */
233187769Sluigi		sprintf(red,
234194930Soleg		    "\n\t %cRED w_q %f min_th %d max_th %d max_p %f",
235204591Sluigi		    (fs->flags & DN_IS_GENTLE_RED) ? 'G' : ' ',
236187769Sluigi		    1.0 * fs->w_q / (double)(1 << SCALE_RED),
237204591Sluigi		    fs->min_th,
238204591Sluigi		    fs->max_th,
239187769Sluigi		    1.0 * fs->max_p / (double)(1 << SCALE_RED));
240187769Sluigi	else
241187769Sluigi		sprintf(red, "droptail");
242187769Sluigi
243204591Sluigi	if (prefix[0]) {
244204591Sluigi	    printf("%s %s%s %d queues (%d buckets) %s\n",
245204591Sluigi		prefix, qs, plr, fs->oid.id, fs->buckets, red);
246204591Sluigi	    prefix[0] = '\0';
247204591Sluigi	} else {
248204591Sluigi	    printf("q%05d %s%s %d flows (%d buckets) sched %d "
249204591Sluigi			"weight %d lmax %d pri %d %s\n",
250204591Sluigi		fs->fs_nr, qs, plr, fs->oid.id, fs->buckets,
251204591Sluigi		fs->sched_nr, fs->par[0], fs->par[1], fs->par[2], red);
252204591Sluigi	    if (fs->flags & DN_HAVE_MASK)
253204591Sluigi		print_mask(&fs->flow_mask);
254204591Sluigi	}
255187769Sluigi}
256187769Sluigi
257190865Sluigistatic void
258204591Sluigiprint_extra_delay_parms(struct dn_profile *p)
259190865Sluigi{
260190865Sluigi	double loss;
261190865Sluigi	if (p->samples_no <= 0)
262190865Sluigi		return;
263190865Sluigi
264190865Sluigi	loss = p->loss_level;
265190865Sluigi	loss /= p->samples_no;
266194930Soleg	printf("\t profile: name \"%s\" loss %f samples %d\n",
267194930Soleg		p->name, loss, p->samples_no);
268190865Sluigi}
269190865Sluigi
/*
 * Print the pending text in `buf` (followed by a newline) if there is
 * any, and leave `buf` holding the empty string.
 */
static void
flush_buf(char *buf)
{
	if (*buf == '\0')
		return;		/* nothing pending */
	printf("%s\n", buf);
	*buf = '\0';
}
277204591Sluigi
278204591Sluigi/*
279204591Sluigi * generic list routine. We expect objects in a specific order, i.e.
280204591Sluigi * PIPES AND SCHEDULERS:
281204591Sluigi *	link; scheduler; internal flowset if any; instances
282204591Sluigi * we can tell a pipe from the number.
283204591Sluigi *
284204591Sluigi * FLOWSETS:
285204591Sluigi *	flowset; queues;
286204591Sluigi * link i (int queue); scheduler i; si(i) { flowsets() : queues }
287204591Sluigi */
288204591Sluigistatic void
289204591Sluigilist_pipes(struct dn_id *oid, struct dn_id *end)
290204591Sluigi{
291204591Sluigi    char buf[160];	/* pending buffer */
292204591Sluigi    buf[0] = '\0';
293187769Sluigi
294204591Sluigi    for (; oid != end; oid = O_NEXT(oid, oid->len)) {
295204591Sluigi	if (oid->len < sizeof(*oid))
296204591Sluigi		errx(1, "invalid oid len %d\n", oid->len);
297187769Sluigi
298204591Sluigi	switch (oid->type) {
299204591Sluigi	default:
300204591Sluigi	    flush_buf(buf);
301204591Sluigi	    printf("unrecognized object %d size %d\n", oid->type, oid->len);
302204591Sluigi	    break;
303204591Sluigi	case DN_TEXT: /* list of attached flowsets */
304204591Sluigi	    {
305204591Sluigi		int i, l;
306204591Sluigi		struct {
307204591Sluigi			struct dn_id id;
308204591Sluigi			uint32_t p[0];
309204591Sluigi		} *d = (void *)oid;
310204591Sluigi		l = (oid->len - sizeof(*oid))/sizeof(d->p[0]);
311204591Sluigi		if (l == 0)
312204591Sluigi		    break;
313204591Sluigi		printf("   Children flowsets: ");
314204591Sluigi		for (i = 0; i < l; i++)
315204591Sluigi			printf("%u ", d->p[i]);
316204591Sluigi		printf("\n");
317204591Sluigi		break;
318204591Sluigi	    }
319204591Sluigi	case DN_CMD_GET:
320204591Sluigi	    if (co.verbose)
321204591Sluigi		printf("answer for cmd %d, len %d\n", oid->type, oid->id);
322204591Sluigi	    break;
323204591Sluigi	case DN_SCH: {
324204591Sluigi	    struct dn_sch *s = (struct dn_sch *)oid;
325204591Sluigi	    flush_buf(buf);
326204591Sluigi	    printf(" sched %d type %s flags 0x%x %d buckets %d active\n",
327204591Sluigi			s->sched_nr,
328204591Sluigi			s->name, s->flags, s->buckets, s->oid.id);
329204591Sluigi	    if (s->flags & DN_HAVE_MASK)
330204591Sluigi		print_mask(&s->sched_mask);
331204591Sluigi	    }
332204591Sluigi	    break;
333187769Sluigi
334204591Sluigi	case DN_FLOW:
335204591Sluigi	    list_flow((struct dn_flow *)oid);
336204591Sluigi	    break;
337187769Sluigi
338204591Sluigi	case DN_LINK: {
339204591Sluigi	    struct dn_link *p = (struct dn_link *)oid;
340204591Sluigi	    double b = p->bandwidth;
341204591Sluigi	    char bwbuf[30];
342204591Sluigi	    char burst[5 + 7];
343187769Sluigi
344204591Sluigi	    /* This starts a new object so flush buffer */
345204591Sluigi	    flush_buf(buf);
346204591Sluigi	    /* data rate */
347204591Sluigi	    if (b == 0)
348204591Sluigi		sprintf(bwbuf, "unlimited     ");
349204591Sluigi	    else if (b >= 1000000)
350204591Sluigi		sprintf(bwbuf, "%7.3f Mbit/s", b/1000000);
351204591Sluigi	    else if (b >= 1000)
352204591Sluigi		sprintf(bwbuf, "%7.3f Kbit/s", b/1000);
353204591Sluigi	    else
354204591Sluigi		sprintf(bwbuf, "%7.3f bit/s ", b);
355187769Sluigi
356204591Sluigi	    if (humanize_number(burst, sizeof(burst), p->burst,
357204591Sluigi		    "", HN_AUTOSCALE, 0) < 0 || co.verbose)
358204591Sluigi		sprintf(burst, "%d", (int)p->burst);
359204591Sluigi	    sprintf(buf, "%05d: %s %4d ms burst %s",
360204591Sluigi		p->link_nr % DN_MAX_ID, bwbuf, p->delay, burst);
361204591Sluigi	    }
362204591Sluigi	    break;
363190865Sluigi
364204591Sluigi	case DN_FS:
365204591Sluigi	    print_flowset_parms((struct dn_fs *)oid, buf);
366204591Sluigi	    break;
367204591Sluigi	case DN_PROFILE:
368204591Sluigi	    flush_buf(buf);
369204591Sluigi	    print_extra_delay_parms((struct dn_profile *)oid);
370187769Sluigi	}
371204591Sluigi	flush_buf(buf); // XXX does it really go here ?
372204591Sluigi    }
373187769Sluigi}
374187769Sluigi
375187769Sluigi/*
376204591Sluigi * Delete pipe, queue or scheduler i
377187769Sluigi */
378187769Sluigiint
379204591Sluigiipfw_delete_pipe(int do_pipe, int i)
380187769Sluigi{
381204591Sluigi	struct {
382204591Sluigi		struct dn_id oid;
383204591Sluigi		uintptr_t a[1];	/* add more if we want a list */
384204591Sluigi	} cmd;
385204591Sluigi	oid_fill((void *)&cmd, sizeof(cmd), DN_CMD_DELETE, DN_API_VERSION);
386204591Sluigi	cmd.oid.subtype = (do_pipe == 1) ? DN_LINK :
387204591Sluigi		( (do_pipe == 2) ? DN_FS : DN_SCH);
388204591Sluigi	cmd.a[0] = i;
389204591Sluigi	i = do_cmd(IP_DUMMYNET3, &cmd, cmd.oid.len);
390187769Sluigi	if (i) {
391187769Sluigi		i = 1;
392187769Sluigi		warn("rule %u: setsockopt(IP_DUMMYNET_DEL)", i);
393187769Sluigi	}
394187769Sluigi	return i;
395187769Sluigi}
396187769Sluigi
397190865Sluigi/*
398190865Sluigi * Code to parse delay profiles.
399190865Sluigi *
400190865Sluigi * Some link types introduce extra delays in the transmission
401190865Sluigi * of a packet, e.g. because of MAC level framing, contention on
402190865Sluigi * the use of the channel, MAC level retransmissions and so on.
403190865Sluigi * From our point of view, the channel is effectively unavailable
404190865Sluigi * for this extra time, which is constant or variable depending
405190865Sluigi * on the link type. Additionally, packets may be dropped after this
406190865Sluigi * time (e.g. on a wireless link after too many retransmissions).
407190865Sluigi * We can model the additional delay with an empirical curve
408190865Sluigi * that represents its distribution.
409190865Sluigi *
410190865Sluigi *	cumulative probability
411190865Sluigi *	1.0 ^
412190865Sluigi *	    |
413190865Sluigi *	L   +-- loss-level          x
414190865Sluigi *	    |                 ******
415190865Sluigi *	    |                *
416190865Sluigi *	    |           *****
417190865Sluigi *	    |          *
418190865Sluigi *	    |        **
419190865Sluigi *	    |       *
420190865Sluigi *	    +-------*------------------->
421190865Sluigi *			delay
422190865Sluigi *
423190865Sluigi * The empirical curve may have both vertical and horizontal lines.
424190865Sluigi * Vertical lines represent constant delay for a range of
 * probabilities; horizontal lines correspond to a discontinuity
426204591Sluigi * in the delay distribution: the link will use the largest delay
427190865Sluigi * for a given probability.
428190865Sluigi *
429190865Sluigi * To pass the curve to dummynet, we must store the parameters
430190865Sluigi * in a file as described below, and issue the command
431190865Sluigi *
432190865Sluigi *      ipfw pipe <n> config ... bw XXX profile <filename> ...
433190865Sluigi *
 * The file format is the following, with whitespace acting as
 * a separator and '#' indicating the beginning of a comment:
436190865Sluigi *
437190865Sluigi *	samples N
438190865Sluigi *		the number of samples used in the internal
439190865Sluigi *		representation (2..1024; default 100);
440190865Sluigi *
441190865Sluigi *	loss-level L
442190865Sluigi *		The probability above which packets are lost.
443190865Sluigi *               (0.0 <= L <= 1.0, default 1.0 i.e. no loss);
444190865Sluigi *
 *	name identifier
 *		An optional name (listed by "ipfw pipe show")
 *		to identify the distribution;
448190865Sluigi *
449190865Sluigi *	"delay prob" | "prob delay"
450190865Sluigi *		One of these two lines is mandatory and defines
451190865Sluigi *		the format of the following lines with data points.
452190865Sluigi *
453190865Sluigi *	XXX YYY
454190865Sluigi *		2 or more lines representing points in the curve,
455190865Sluigi *		with either delay or probability first, according
456190865Sluigi *		to the chosen format.
457190865Sluigi *		The unit for delay is milliseconds.
458190865Sluigi *
 * Data points do not need to be ordered, nor does their count need to
 * match the number specified in the "samples" line. ipfw will sort and
 * interpolate the curve as needed.
462190865Sluigi *
463190865Sluigi * Example of a profile file:
464190865Sluigi
465190865Sluigi        name    bla_bla_bla
466190865Sluigi        samples 100
467190865Sluigi        loss-level    0.86
468190865Sluigi        prob    delay
469190865Sluigi        0       200	# minimum overhead is 200ms
470190865Sluigi        0.5     200
471190865Sluigi        0.5     300
472190865Sluigi        0.8     1000
473190865Sluigi        0.9     1300
474190865Sluigi        1       1300
475190865Sluigi
476190865Sluigi * Internally, we will convert the curve to a fixed number of
477190865Sluigi * samples, and when it is time to transmit a packet we will
478190865Sluigi * model the extra delay as extra bits in the packet.
479190865Sluigi *
480190865Sluigi */
481190865Sluigi
/*
 * Limits and keywords used when parsing a delay-profile file.
 * ED_MAX_LINE_LEN is parenthesized so that it expands as a single
 * value inside larger expressions.
 */
#define ED_MAX_LINE_LEN	(256 + ED_MAX_NAME_LEN)
#define ED_TOK_SAMPLES	"samples"
#define ED_TOK_LOSS	"loss-level"
#define ED_TOK_NAME	"name"
#define ED_TOK_DELAY	"delay"
#define ED_TOK_PROB	"prob"
#define ED_TOK_BW	"bw"
#define ED_SEPARATORS	" \t\n"
#define ED_MIN_SAMPLES_NO	2
491190865Sluigi
/*
 * Returns 1 if s is a non-negative decimal number: one or more digits
 * with at most one '.', and nothing else (no sign, no exponent, no
 * blanks). Returns 0 otherwise, including for strings that contain no
 * digit at all ("" or ".").
 */
static int
is_valid_number(const char *s)
{
	int dots_found = 0;
	int have_digit = 0;

	for (; *s != '\0'; ++s) {
		/* isdigit() is only defined for unsigned char values / EOF */
		if (isdigit((unsigned char)*s))
			have_digit = 1;
		else if (*s != '.' || ++dots_found > 1)
			return 0;
	}
	return have_digit;
}
506190865Sluigi
/*
 * Parse a bandwidth argument.
 *
 * If `arg` starts with a lowercase letter it is taken as the name of
 * the clocking interface: it is copied (truncated if necessary, with a
 * warning) into `if_name`, a buffer of `namelen` bytes, and *bandwidth
 * is set to 0. A NULL `if_name` means interface names are not accepted.
 *
 * Otherwise `arg` is a number with an optional K/k (x1000) or M
 * (x1000000) multiplier and an optional unit; byte-based units multiply
 * the value by 8. The result is stored in *bandwidth and `if_name`,
 * when given, is set to the empty string. Values that do not fit in an
 * int are rejected with EX_DATAERR.
 *
 * A warning is printed when *bandwidth was already set (!= -1).
 */
static void
read_bandwidth(char *arg, int *bandwidth, char *if_name, int namelen)
{
	if (*bandwidth != -1)
		warnx("duplicate token, override bandwidth value!");

	if (arg[0] >= 'a' && arg[0] <= 'z') {
		if (!if_name || namelen <= 0) {
			errx(1, "no if support");
		}
		/*
		 * Warn only when the name really does not fit; warnx()
		 * because no system call failed, so errno is meaningless.
		 */
		if (strlen(arg) >= (size_t)namelen)
			warnx("interface name truncated");
		namelen--;
		/* interface name */
		strncpy(if_name, arg, namelen);
		if_name[namelen] = '\0';
		*bandwidth = 0;
	} else {	/* read bandwidth value */
		unsigned long long bw;
		char *end = NULL;

		/*
		 * Do the arithmetic in a wide unsigned type. Bounding the
		 * parsed value by INT_MAX first guarantees the scaling
		 * below (at most x1000000 x8) cannot wrap.
		 */
		bw = strtoul(arg, &end, 0);
		if (bw > INT_MAX)
			errx(EX_DATAERR, "bandwidth too large");

		if (*end == 'K' || *end == 'k') {
			end++;
			bw *= 1000;
		} else if (*end == 'M') {
			end++;
			bw *= 1000000;
		}
		if ((*end == 'B' &&
			_substrcmp2(end, "Bi", "Bit/s") != 0) ||
		    _substrcmp2(end, "by", "bytes") == 0)
			bw *= 8;

		if (bw > INT_MAX)
			errx(EX_DATAERR, "bandwidth too large");

		*bandwidth = (int)bw;
		if (if_name)
			if_name[0] = '\0';
	}
}
554193715Sluigi
/* One data point of a delay profile: a probability and a delay. */
struct point {
	double prob;
	double delay;
};

/*
 * qsort() comparator for struct point: order by probability first and,
 * for equal probabilities, by delay. Returns -1, 0 or 1.
 */
static int
compare_points(const void *vp1, const void *vp2)
{
	const struct point *a = vp1;
	const struct point *b = vp2;
	double diff = a->prob - b->prob;

	if (diff == 0)
		diff = a->delay - b->delay;
	return (diff > 0) - (diff < 0);
}
577190865Sluigi
578190865Sluigi#define ED_EFMT(s) EX_DATAERR,"error in %s at line %d: "#s,filename,lineno
579190865Sluigi
580190865Sluigistatic void
581204591Sluigiload_extra_delays(const char *filename, struct dn_profile *p,
582204591Sluigi	struct dn_link *link)
583190865Sluigi{
584190865Sluigi	char    line[ED_MAX_LINE_LEN];
585190865Sluigi	FILE    *f;
586190865Sluigi	int     lineno = 0;
587190865Sluigi	int     i;
588190865Sluigi
589190865Sluigi	int     samples = -1;
590190865Sluigi	double  loss = -1.0;
591190865Sluigi	char    profile_name[ED_MAX_NAME_LEN];
592190865Sluigi	int     delay_first = -1;
593190865Sluigi	int     do_points = 0;
594190865Sluigi	struct point    points[ED_MAX_SAMPLES_NO];
595190865Sluigi	int     points_no = 0;
596190865Sluigi
597204591Sluigi	/* XXX link never NULL? */
598204591Sluigi	p->link_nr = link->link_nr;
599204591Sluigi
600190865Sluigi	profile_name[0] = '\0';
601190865Sluigi	f = fopen(filename, "r");
602190865Sluigi	if (f == NULL)
603190865Sluigi		err(EX_UNAVAILABLE, "fopen: %s", filename);
604190865Sluigi
605190865Sluigi	while (fgets(line, ED_MAX_LINE_LEN, f)) {         /* read commands */
606190865Sluigi		char *s, *cur = line, *name = NULL, *arg = NULL;
607190865Sluigi
608190865Sluigi		++lineno;
609190865Sluigi
610190865Sluigi		/* parse the line */
611190865Sluigi		while (cur) {
612190865Sluigi			s = strsep(&cur, ED_SEPARATORS);
613190865Sluigi			if (s == NULL || *s == '#')
614190865Sluigi				break;
615190865Sluigi			if (*s == '\0')
616190865Sluigi				continue;
617190865Sluigi			if (arg)
618190865Sluigi				errx(ED_EFMT("too many arguments"));
619190865Sluigi			if (name == NULL)
620190865Sluigi				name = s;
621190865Sluigi			else
622190865Sluigi				arg = s;
623190865Sluigi		}
624190865Sluigi		if (name == NULL)	/* empty line */
625190865Sluigi			continue;
626190865Sluigi		if (arg == NULL)
627190865Sluigi			errx(ED_EFMT("missing arg for %s"), name);
628190865Sluigi
629190865Sluigi		if (!strcasecmp(name, ED_TOK_SAMPLES)) {
630190865Sluigi		    if (samples > 0)
631190865Sluigi			errx(ED_EFMT("duplicate ``samples'' line"));
632190865Sluigi		    if (atoi(arg) <=0)
633190865Sluigi			errx(ED_EFMT("invalid number of samples"));
634190865Sluigi		    samples = atoi(arg);
635190865Sluigi		    if (samples>ED_MAX_SAMPLES_NO)
636190865Sluigi			    errx(ED_EFMT("too many samples, maximum is %d"),
637190865Sluigi				ED_MAX_SAMPLES_NO);
638190865Sluigi		    do_points = 0;
639193715Sluigi		} else if (!strcasecmp(name, ED_TOK_BW)) {
640204591Sluigi		    char buf[IFNAMSIZ];
641204591Sluigi		    read_bandwidth(arg, &link->bandwidth, buf, sizeof(buf));
642190865Sluigi		} else if (!strcasecmp(name, ED_TOK_LOSS)) {
643190865Sluigi		    if (loss != -1.0)
644190865Sluigi			errx(ED_EFMT("duplicated token: %s"), name);
645190865Sluigi		    if (!is_valid_number(arg))
646190865Sluigi			errx(ED_EFMT("invalid %s"), arg);
647190865Sluigi		    loss = atof(arg);
648190865Sluigi		    if (loss > 1)
649190865Sluigi			errx(ED_EFMT("%s greater than 1.0"), name);
650190865Sluigi		    do_points = 0;
651190865Sluigi		} else if (!strcasecmp(name, ED_TOK_NAME)) {
652190865Sluigi		    if (profile_name[0] != '\0')
653190865Sluigi			errx(ED_EFMT("duplicated token: %s"), name);
654190865Sluigi		    strncpy(profile_name, arg, sizeof(profile_name) - 1);
655190865Sluigi		    profile_name[sizeof(profile_name)-1] = '\0';
656190865Sluigi		    do_points = 0;
657190865Sluigi		} else if (!strcasecmp(name, ED_TOK_DELAY)) {
658190865Sluigi		    if (do_points)
659190865Sluigi			errx(ED_EFMT("duplicated token: %s"), name);
660190865Sluigi		    delay_first = 1;
661190865Sluigi		    do_points = 1;
662190865Sluigi		} else if (!strcasecmp(name, ED_TOK_PROB)) {
663190865Sluigi		    if (do_points)
664190865Sluigi			errx(ED_EFMT("duplicated token: %s"), name);
665190865Sluigi		    delay_first = 0;
666190865Sluigi		    do_points = 1;
667190865Sluigi		} else if (do_points) {
668190865Sluigi		    if (!is_valid_number(name) || !is_valid_number(arg))
669190865Sluigi			errx(ED_EFMT("invalid point found"));
670190865Sluigi		    if (delay_first) {
671190865Sluigi			points[points_no].delay = atof(name);
672190865Sluigi			points[points_no].prob = atof(arg);
673190865Sluigi		    } else {
674190865Sluigi			points[points_no].delay = atof(arg);
675190865Sluigi			points[points_no].prob = atof(name);
676190865Sluigi		    }
677190865Sluigi		    if (points[points_no].prob > 1.0)
678190865Sluigi			errx(ED_EFMT("probability greater than 1.0"));
679190865Sluigi		    ++points_no;
680190865Sluigi		} else {
681190865Sluigi		    errx(ED_EFMT("unrecognised command '%s'"), name);
682190865Sluigi		}
683190865Sluigi	}
684190865Sluigi
685199626Snetchild	fclose (f);
686199626Snetchild
687190865Sluigi	if (samples == -1) {
688190865Sluigi	    warnx("'%s' not found, assuming 100", ED_TOK_SAMPLES);
689190865Sluigi	    samples = 100;
690190865Sluigi	}
691190865Sluigi
692190865Sluigi	if (loss == -1.0) {
693190865Sluigi	    warnx("'%s' not found, assuming no loss", ED_TOK_LOSS);
694190865Sluigi	    loss = 1;
695190865Sluigi	}
696190865Sluigi
697190865Sluigi	/* make sure that there are enough points. */
698190865Sluigi	if (points_no < ED_MIN_SAMPLES_NO)
699190865Sluigi	    errx(ED_EFMT("too few samples, need at least %d"),
700190865Sluigi		ED_MIN_SAMPLES_NO);
701190865Sluigi
702190865Sluigi	qsort(points, points_no, sizeof(struct point), compare_points);
703190865Sluigi
704190865Sluigi	/* interpolation */
705190865Sluigi	for (i = 0; i<points_no-1; ++i) {
706190865Sluigi	    double y1 = points[i].prob * samples;
707190865Sluigi	    double x1 = points[i].delay;
708190865Sluigi	    double y2 = points[i+1].prob * samples;
709190865Sluigi	    double x2 = points[i+1].delay;
710190865Sluigi
711204591Sluigi	    int ix = y1;
712190865Sluigi	    int stop = y2;
713190865Sluigi
714190865Sluigi	    if (x1 == x2) {
715204591Sluigi		for (; ix<stop; ++ix)
716204591Sluigi		    p->samples[ix] = x1;
717190865Sluigi	    } else {
718190865Sluigi		double m = (y2-y1)/(x2-x1);
719190865Sluigi		double c = y1 - m*x1;
720204591Sluigi		for (; ix<stop ; ++ix)
721204591Sluigi		    p->samples[ix] = (ix - c)/m;
722190865Sluigi	    }
723190865Sluigi	}
724190865Sluigi	p->samples_no = samples;
725190865Sluigi	p->loss_level = loss * samples;
726190865Sluigi	strncpy(p->name, profile_name, sizeof(p->name));
727190865Sluigi}
728190865Sluigi
729204591Sluigi/*
730204591Sluigi * configuration of pipes, schedulers, flowsets.
731204591Sluigi * When we configure a new scheduler, an empty pipe is created, so:
732204591Sluigi *
733204591Sluigi * do_pipe = 1 -> "pipe N config ..." only for backward compatibility
734204591Sluigi *	sched N+Delta type fifo sched_mask ...
735204591Sluigi *	pipe N+Delta <parameters>
736204591Sluigi *	flowset N+Delta pipe N+Delta (no parameters)
737204591Sluigi *	sched N type wf2q+ sched_mask ...
738204591Sluigi *	pipe N <parameters>
739204591Sluigi *
740204591Sluigi * do_pipe = 2 -> flowset N config
741204591Sluigi *	flowset N parameters
742204591Sluigi *
743204591Sluigi * do_pipe = 3 -> sched N config
744204591Sluigi *	sched N parameters (default no pipe)
745204591Sluigi *	optional Pipe N config ...
746204591Sluigi * pipe ==>
747204591Sluigi */
748187769Sluigivoid
749187769Sluigiipfw_config_pipe(int ac, char **av)
750187769Sluigi{
751204591Sluigi	int i, j;
752187769Sluigi	char *end;
753187769Sluigi	void *par = NULL;
754204591Sluigi	struct dn_id *buf, *base;
755204591Sluigi	struct dn_sch *sch = NULL;
756204591Sluigi	struct dn_link *p = NULL;
757204591Sluigi	struct dn_fs *fs = NULL;
758204591Sluigi	struct dn_profile *pf = NULL;
759204591Sluigi	struct ipfw_flow_id *mask = NULL;
760204591Sluigi	int lmax;
761204591Sluigi	uint32_t _foo = 0, *flags = &_foo , *buckets = &_foo;
762187769Sluigi
763204591Sluigi	/*
764204591Sluigi	 * allocate space for 1 header,
765204591Sluigi	 * 1 scheduler, 1 link, 1 flowset, 1 profile
766204591Sluigi	 */
767204591Sluigi	lmax = sizeof(struct dn_id);	/* command header */
768204591Sluigi	lmax += sizeof(struct dn_sch) + sizeof(struct dn_link) +
769204591Sluigi		sizeof(struct dn_fs) + sizeof(struct dn_profile);
770187769Sluigi
771187769Sluigi	av++; ac--;
772187769Sluigi	/* Pipe number */
773187769Sluigi	if (ac && isdigit(**av)) {
774187769Sluigi		i = atoi(*av); av++; ac--;
775204591Sluigi	} else
776204591Sluigi		i = -1;
777204591Sluigi	if (i <= 0)
778204591Sluigi		errx(EX_USAGE, "need a pipe/flowset/sched number");
779204591Sluigi	base = buf = safe_calloc(1, lmax);
780204591Sluigi	/* all commands start with a 'CONFIGURE' and a version */
781204591Sluigi	o_next(&buf, sizeof(struct dn_id), DN_CMD_CONFIG);
782204591Sluigi	base->id = DN_API_VERSION;
783204591Sluigi
784204591Sluigi	switch (co.do_pipe) {
785204591Sluigi	case 1: /* "pipe N config ..." */
786204591Sluigi		/* Allocate space for the WF2Q+ scheduler, its link
787204591Sluigi		 * and the FIFO flowset. Set the number, but leave
788204591Sluigi		 * the scheduler subtype and other parameters to 0
789204591Sluigi		 * so the kernel will use appropriate defaults.
790204591Sluigi		 * XXX todo: add a flag to record if a parameter
791204591Sluigi		 * is actually configured.
792204591Sluigi		 * If we do a 'pipe config' mask -> sched_mask.
793204591Sluigi		 * The FIFO scheduler and link are derived from the
794204591Sluigi		 * WF2Q+ one in the kernel.
795204591Sluigi		 */
796204591Sluigi		sch = o_next(&buf, sizeof(*sch), DN_SCH);
797204591Sluigi		p = o_next(&buf, sizeof(*p), DN_LINK);
798204591Sluigi		fs = o_next(&buf, sizeof(*fs), DN_FS);
799204591Sluigi
800204591Sluigi		sch->sched_nr = i;
801204591Sluigi		sch->oid.subtype = 0;	/* defaults to WF2Q+ */
802204591Sluigi		mask = &sch->sched_mask;
803204591Sluigi		flags = &sch->flags;
804204591Sluigi		buckets = &sch->buckets;
805204591Sluigi		*flags |= DN_PIPE_CMD;
806204591Sluigi
807204591Sluigi		p->link_nr = i;
808204591Sluigi
809204591Sluigi		/* This flowset is only for the FIFO scheduler */
810204591Sluigi		fs->fs_nr = i + 2*DN_MAX_ID;
811204591Sluigi		fs->sched_nr = i + DN_MAX_ID;
812204591Sluigi		break;
813204591Sluigi
814204591Sluigi	case 2: /* "queue N config ... " */
815204591Sluigi		fs = o_next(&buf, sizeof(*fs), DN_FS);
816204591Sluigi		fs->fs_nr = i;
817204591Sluigi		mask = &fs->flow_mask;
818204591Sluigi		flags = &fs->flags;
819204591Sluigi		buckets = &fs->buckets;
820204591Sluigi		break;
821204591Sluigi
822204591Sluigi	case 3: /* "sched N config ..." */
823204591Sluigi		sch = o_next(&buf, sizeof(*sch), DN_SCH);
824204591Sluigi		fs = o_next(&buf, sizeof(*fs), DN_FS);
825204591Sluigi		sch->sched_nr = i;
826204591Sluigi		mask = &sch->sched_mask;
827204591Sluigi		flags = &sch->flags;
828204591Sluigi		buckets = &sch->buckets;
829204591Sluigi		/* fs is used only with !MULTIQUEUE schedulers */
830204591Sluigi		fs->fs_nr = i + DN_MAX_ID;
831204591Sluigi		fs->sched_nr = i;
832204591Sluigi		break;
833187769Sluigi	}
834204591Sluigi	/* set to -1 those fields for which we want to reuse existing
835204591Sluigi	 * values from the kernel.
836204591Sluigi	 * Also, *_nr and subtype = 0 mean reuse the value from the kernel.
837204591Sluigi	 * XXX todo: support reuse of the mask.
838204591Sluigi	 */
839204591Sluigi	if (p)
840204591Sluigi		p->bandwidth = -1;
841204591Sluigi	for (j = 0; j < sizeof(fs->par)/sizeof(fs->par[0]); j++)
842204591Sluigi		fs->par[j] = -1;
843187769Sluigi	while (ac > 0) {
844187769Sluigi		double d;
845187769Sluigi		int tok = match_token(dummynet_params, *av);
846187769Sluigi		ac--; av++;
847187769Sluigi
848187769Sluigi		switch(tok) {
849187769Sluigi		case TOK_NOERROR:
850204591Sluigi			NEED(fs, "noerror is only for pipes");
851204591Sluigi			fs->flags |= DN_NOERROR;
852187769Sluigi			break;
853187769Sluigi
854187769Sluigi		case TOK_PLR:
855204591Sluigi			NEED(fs, "plr is only for pipes");
856187769Sluigi			NEED1("plr needs argument 0..1\n");
857187769Sluigi			d = strtod(av[0], NULL);
858187769Sluigi			if (d > 1)
859187769Sluigi				d = 1;
860187769Sluigi			else if (d < 0)
861187769Sluigi				d = 0;
862204591Sluigi			fs->plr = (int)(d*0x7fffffff);
863187769Sluigi			ac--; av++;
864187769Sluigi			break;
865187769Sluigi
866187769Sluigi		case TOK_QUEUE:
867204591Sluigi			NEED(fs, "queue is only for pipes or flowsets");
868187769Sluigi			NEED1("queue needs queue size\n");
869187769Sluigi			end = NULL;
870204591Sluigi			fs->qsize = strtoul(av[0], &end, 0);
871187769Sluigi			if (*end == 'K' || *end == 'k') {
872204591Sluigi				fs->flags |= DN_QSIZE_BYTES;
873204591Sluigi				fs->qsize *= 1024;
874187769Sluigi			} else if (*end == 'B' ||
875187769Sluigi			    _substrcmp2(end, "by", "bytes") == 0) {
876204591Sluigi				fs->flags |= DN_QSIZE_BYTES;
877187769Sluigi			}
878187769Sluigi			ac--; av++;
879187769Sluigi			break;
880187769Sluigi
881187769Sluigi		case TOK_BUCKETS:
882204591Sluigi			NEED(fs, "buckets is only for pipes or flowsets");
883187769Sluigi			NEED1("buckets needs argument\n");
884204591Sluigi			*buckets = strtoul(av[0], NULL, 0);
885187769Sluigi			ac--; av++;
886187769Sluigi			break;
887187769Sluigi
888204591Sluigi		case TOK_FLOW_MASK:
889204591Sluigi		case TOK_SCHED_MASK:
890187769Sluigi		case TOK_MASK:
891204591Sluigi			NEED(mask, "tok_mask");
892187769Sluigi			NEED1("mask needs mask specifier\n");
893187769Sluigi			/*
894187769Sluigi			 * per-flow queue, mask is dst_ip, dst_port,
895187769Sluigi			 * src_ip, src_port, proto measured in bits
896187769Sluigi			 */
897187769Sluigi			par = NULL;
898187769Sluigi
899204591Sluigi			bzero(mask, sizeof(*mask));
900187769Sluigi			end = NULL;
901187769Sluigi
902187769Sluigi			while (ac >= 1) {
903187769Sluigi			    uint32_t *p32 = NULL;
904187769Sluigi			    uint16_t *p16 = NULL;
905187769Sluigi			    uint32_t *p20 = NULL;
906187769Sluigi			    struct in6_addr *pa6 = NULL;
907187769Sluigi			    uint32_t a;
908187769Sluigi
909187769Sluigi			    tok = match_token(dummynet_params, *av);
910187769Sluigi			    ac--; av++;
911187769Sluigi			    switch(tok) {
912187769Sluigi			    case TOK_ALL:
913187769Sluigi				    /*
914187769Sluigi				     * special case, all bits significant
915187769Sluigi				     */
916204591Sluigi				    mask->dst_ip = ~0;
917204591Sluigi				    mask->src_ip = ~0;
918204591Sluigi				    mask->dst_port = ~0;
919204591Sluigi				    mask->src_port = ~0;
920204591Sluigi				    mask->proto = ~0;
921204591Sluigi				    n2mask(&mask->dst_ip6, 128);
922204591Sluigi				    n2mask(&mask->src_ip6, 128);
923204591Sluigi				    mask->flow_id6 = ~0;
924204591Sluigi				    *flags |= DN_HAVE_MASK;
925187769Sluigi				    goto end_mask;
926187769Sluigi
927187769Sluigi			    case TOK_DSTIP:
928204591Sluigi				    mask->addr_type = 4;
929204591Sluigi				    p32 = &mask->dst_ip;
930187769Sluigi				    break;
931187769Sluigi
932187769Sluigi			    case TOK_SRCIP:
933204591Sluigi				    mask->addr_type = 4;
934204591Sluigi				    p32 = &mask->src_ip;
935187769Sluigi				    break;
936187769Sluigi
937187769Sluigi			    case TOK_DSTIP6:
938204591Sluigi				    mask->addr_type = 6;
939204591Sluigi				    pa6 = &mask->dst_ip6;
940187769Sluigi				    break;
941187769Sluigi
942187769Sluigi			    case TOK_SRCIP6:
943204591Sluigi				    mask->addr_type = 6;
944204591Sluigi				    pa6 = &mask->src_ip6;
945187769Sluigi				    break;
946187769Sluigi
947187769Sluigi			    case TOK_FLOWID:
948204591Sluigi				    mask->addr_type = 6;
949204591Sluigi				    p20 = &mask->flow_id6;
950187769Sluigi				    break;
951187769Sluigi
952187769Sluigi			    case TOK_DSTPORT:
953204591Sluigi				    p16 = &mask->dst_port;
954187769Sluigi				    break;
955187769Sluigi
956187769Sluigi			    case TOK_SRCPORT:
957204591Sluigi				    p16 = &mask->src_port;
958187769Sluigi				    break;
959187769Sluigi
960187769Sluigi			    case TOK_PROTO:
961187769Sluigi				    break;
962187769Sluigi
963187769Sluigi			    default:
964187769Sluigi				    ac++; av--; /* backtrack */
965187769Sluigi				    goto end_mask;
966187769Sluigi			    }
967187769Sluigi			    if (ac < 1)
968187769Sluigi				    errx(EX_USAGE, "mask: value missing");
969187769Sluigi			    if (*av[0] == '/') {
970187769Sluigi				    a = strtoul(av[0]+1, &end, 0);
971187769Sluigi				    if (pa6 == NULL)
972187769Sluigi					    a = (a == 32) ? ~0 : (1 << a) - 1;
973187769Sluigi			    } else
974187769Sluigi				    a = strtoul(av[0], &end, 0);
975187769Sluigi			    if (p32 != NULL)
976187769Sluigi				    *p32 = a;
977187769Sluigi			    else if (p16 != NULL) {
978187769Sluigi				    if (a > 0xFFFF)
979187769Sluigi					    errx(EX_DATAERR,
980187769Sluigi						"port mask must be 16 bit");
981187769Sluigi				    *p16 = (uint16_t)a;
982187769Sluigi			    } else if (p20 != NULL) {
983187769Sluigi				    if (a > 0xfffff)
984187769Sluigi					errx(EX_DATAERR,
985187769Sluigi					    "flow_id mask must be 20 bit");
986187769Sluigi				    *p20 = (uint32_t)a;
987187769Sluigi			    } else if (pa6 != NULL) {
988187769Sluigi				    if (a > 128)
989187769Sluigi					errx(EX_DATAERR,
990187769Sluigi					    "in6addr invalid mask len");
991187769Sluigi				    else
992187769Sluigi					n2mask(pa6, a);
993187769Sluigi			    } else {
994187769Sluigi				    if (a > 0xFF)
995187769Sluigi					    errx(EX_DATAERR,
996187769Sluigi						"proto mask must be 8 bit");
997204591Sluigi				    fs->flow_mask.proto = (uint8_t)a;
998187769Sluigi			    }
999187769Sluigi			    if (a != 0)
1000204591Sluigi				    *flags |= DN_HAVE_MASK;
1001187769Sluigi			    ac--; av++;
1002187769Sluigi			} /* end while, config masks */
1003187769Sluigiend_mask:
1004187769Sluigi			break;
1005187769Sluigi
1006187769Sluigi		case TOK_RED:
1007187769Sluigi		case TOK_GRED:
1008187769Sluigi			NEED1("red/gred needs w_q/min_th/max_th/max_p\n");
1009204591Sluigi			fs->flags |= DN_IS_RED;
1010187769Sluigi			if (tok == TOK_GRED)
1011204591Sluigi				fs->flags |= DN_IS_GENTLE_RED;
1012187769Sluigi			/*
1013187769Sluigi			 * the format for parameters is w_q/min_th/max_th/max_p
1014187769Sluigi			 */
1015187769Sluigi			if ((end = strsep(&av[0], "/"))) {
1016187769Sluigi			    double w_q = strtod(end, NULL);
1017187769Sluigi			    if (w_q > 1 || w_q <= 0)
1018187769Sluigi				errx(EX_DATAERR, "0 < w_q <= 1");
1019204591Sluigi			    fs->w_q = (int) (w_q * (1 << SCALE_RED));
1020187769Sluigi			}
1021187769Sluigi			if ((end = strsep(&av[0], "/"))) {
1022204591Sluigi			    fs->min_th = strtoul(end, &end, 0);
1023187769Sluigi			    if (*end == 'K' || *end == 'k')
1024204591Sluigi				fs->min_th *= 1024;
1025187769Sluigi			}
1026187769Sluigi			if ((end = strsep(&av[0], "/"))) {
1027204591Sluigi			    fs->max_th = strtoul(end, &end, 0);
1028187769Sluigi			    if (*end == 'K' || *end == 'k')
1029204591Sluigi				fs->max_th *= 1024;
1030187769Sluigi			}
1031187769Sluigi			if ((end = strsep(&av[0], "/"))) {
1032187769Sluigi			    double max_p = strtod(end, NULL);
1033187769Sluigi			    if (max_p > 1 || max_p <= 0)
1034187769Sluigi				errx(EX_DATAERR, "0 < max_p <= 1");
1035204591Sluigi			    fs->max_p = (int)(max_p * (1 << SCALE_RED));
1036187769Sluigi			}
1037187769Sluigi			ac--; av++;
1038187769Sluigi			break;
1039187769Sluigi
1040187769Sluigi		case TOK_DROPTAIL:
1041204591Sluigi			NEED(fs, "droptail is only for flowsets");
1042204591Sluigi			fs->flags &= ~(DN_IS_RED|DN_IS_GENTLE_RED);
1043187769Sluigi			break;
1044187769Sluigi
1045187769Sluigi		case TOK_BW:
1046204591Sluigi			NEED(p, "bw is only for links");
1047187769Sluigi			NEED1("bw needs bandwidth or interface\n");
1048204591Sluigi			read_bandwidth(av[0], &p->bandwidth, NULL, 0);
1049187769Sluigi			ac--; av++;
1050187769Sluigi			break;
1051187769Sluigi
1052187769Sluigi		case TOK_DELAY:
1053204591Sluigi			NEED(p, "delay is only for links");
1054187769Sluigi			NEED1("delay needs argument 0..10000ms\n");
1055204591Sluigi			p->delay = strtoul(av[0], NULL, 0);
1056187769Sluigi			ac--; av++;
1057187769Sluigi			break;
1058187769Sluigi
1059204591Sluigi		case TOK_TYPE: {
1060204591Sluigi			int l;
1061204591Sluigi			NEED(sch, "type is only for schedulers");
1062204591Sluigi			NEED1("type needs a string");
1063204591Sluigi			l = strlen(av[0]);
1064204591Sluigi			if (l == 0 || l > 15)
1065204591Sluigi				errx(1, "type %s too long\n", av[0]);
1066204591Sluigi			strcpy(sch->name, av[0]);
1067204591Sluigi			sch->oid.subtype = 0; /* use string */
1068204591Sluigi			ac--; av++;
1069204591Sluigi			break;
1070204591Sluigi		    }
1071204591Sluigi
1072187769Sluigi		case TOK_WEIGHT:
1073204591Sluigi			NEED(fs, "weight is only for flowsets");
1074204591Sluigi			NEED1("weight needs argument\n");
1075204591Sluigi			fs->par[0] = strtol(av[0], &end, 0);
1076187769Sluigi			ac--; av++;
1077187769Sluigi			break;
1078187769Sluigi
1079204591Sluigi		case TOK_LMAX:
1080204591Sluigi			NEED(fs, "lmax is only for flowsets");
1081204591Sluigi			NEED1("lmax needs argument\n");
1082204591Sluigi			fs->par[1] = strtol(av[0], &end, 0);
1083204591Sluigi			ac--; av++;
1084204591Sluigi			break;
1085204591Sluigi
1086204591Sluigi		case TOK_PRI:
1087204591Sluigi			NEED(fs, "priority is only for flowsets");
1088204591Sluigi			NEED1("priority needs argument\n");
1089204591Sluigi			fs->par[2] = strtol(av[0], &end, 0);
1090204591Sluigi			ac--; av++;
1091204591Sluigi			break;
1092204591Sluigi
1093204591Sluigi		case TOK_SCHED:
1094187769Sluigi		case TOK_PIPE:
1095204591Sluigi			NEED(fs, "pipe/sched");
1096204591Sluigi			NEED1("pipe/link/sched needs number\n");
1097204591Sluigi			fs->sched_nr = strtoul(av[0], &end, 0);
1098187769Sluigi			ac--; av++;
1099187769Sluigi			break;
1100187769Sluigi
1101204591Sluigi		case TOK_PROFILE:
1102204591Sluigi			NEED((!pf), "profile already set");
1103204591Sluigi			NEED(p, "profile");
1104204591Sluigi		    {
1105190865Sluigi			NEED1("extra delay needs the file name\n");
1106204591Sluigi			pf = o_next(&buf, sizeof(*pf), DN_PROFILE);
1107204591Sluigi			load_extra_delays(av[0], pf, p); //XXX can't fail?
1108190865Sluigi			--ac; ++av;
1109204591Sluigi		    }
1110190865Sluigi			break;
1111190865Sluigi
1112194930Soleg		case TOK_BURST:
1113204591Sluigi			NEED(p, "burst");
1114194930Soleg			NEED1("burst needs argument\n");
1115194930Soleg			errno = 0;
1116204591Sluigi			if (expand_number(av[0], (int64_t *)&p->burst) < 0)
1117194930Soleg				if (errno != ERANGE)
1118194930Soleg					errx(EX_DATAERR,
1119194930Soleg					    "burst: invalid argument");
1120204591Sluigi			if (errno || p->burst > (1ULL << 48) - 1)
1121194930Soleg				errx(EX_DATAERR,
1122194930Soleg				    "burst: out of range (0..2^48-1)");
1123194930Soleg			ac--; av++;
1124194930Soleg			break;
1125194930Soleg
1126187769Sluigi		default:
1127187769Sluigi			errx(EX_DATAERR, "unrecognised option ``%s''", av[-1]);
1128187769Sluigi		}
1129187769Sluigi	}
1130204591Sluigi
1131204591Sluigi	/* check validity of parameters */
1132204591Sluigi	if (p) {
1133204591Sluigi		if (p->delay > 10000)
1134187769Sluigi			errx(EX_DATAERR, "delay must be < 10000");
1135204591Sluigi		if (p->bandwidth == -1)
1136204591Sluigi			p->bandwidth = 0;
1137187769Sluigi	}
1138204591Sluigi	if (fs) {
1139204591Sluigi		/* XXX accept a 0 scheduler to keep the default */
1140204591Sluigi	    if (fs->flags & DN_QSIZE_BYTES) {
1141187769Sluigi		size_t len;
1142187769Sluigi		long limit;
1143187769Sluigi
1144187769Sluigi		len = sizeof(limit);
1145187769Sluigi		if (sysctlbyname("net.inet.ip.dummynet.pipe_byte_limit",
1146187769Sluigi			&limit, &len, NULL, 0) == -1)
1147187769Sluigi			limit = 1024*1024;
1148204591Sluigi		if (fs->qsize > limit)
1149187769Sluigi			errx(EX_DATAERR, "queue size must be < %ldB", limit);
1150204591Sluigi	    } else {
1151187769Sluigi		size_t len;
1152187769Sluigi		long limit;
1153187769Sluigi
1154187769Sluigi		len = sizeof(limit);
1155187769Sluigi		if (sysctlbyname("net.inet.ip.dummynet.pipe_slot_limit",
1156187769Sluigi			&limit, &len, NULL, 0) == -1)
1157187769Sluigi			limit = 100;
1158204591Sluigi		if (fs->qsize > limit)
1159187769Sluigi			errx(EX_DATAERR, "2 <= queue size <= %ld", limit);
1160204591Sluigi	    }
1161204591Sluigi
1162204591Sluigi	    if (fs->flags & DN_IS_RED) {
1163187769Sluigi		size_t len;
1164187769Sluigi		int lookup_depth, avg_pkt_size;
1165204591Sluigi		double w_q;
1166187769Sluigi
1167204591Sluigi		if (fs->min_th >= fs->max_th)
1168187769Sluigi		    errx(EX_DATAERR, "min_th %d must be < than max_th %d",
1169204591Sluigi			fs->min_th, fs->max_th);
1170204591Sluigi		if (fs->max_th == 0)
1171187769Sluigi		    errx(EX_DATAERR, "max_th must be > 0");
1172187769Sluigi
1173187769Sluigi		len = sizeof(int);
1174187769Sluigi		if (sysctlbyname("net.inet.ip.dummynet.red_lookup_depth",
1175187769Sluigi			&lookup_depth, &len, NULL, 0) == -1)
1176204591Sluigi			lookup_depth = 256;
1177187769Sluigi		if (lookup_depth == 0)
1178187769Sluigi		    errx(EX_DATAERR, "net.inet.ip.dummynet.red_lookup_depth"
1179187769Sluigi			" must be greater than zero");
1180187769Sluigi
1181187769Sluigi		len = sizeof(int);
1182187769Sluigi		if (sysctlbyname("net.inet.ip.dummynet.red_avg_pkt_size",
1183187769Sluigi			&avg_pkt_size, &len, NULL, 0) == -1)
1184204591Sluigi			avg_pkt_size = 512;
1185187769Sluigi
1186187769Sluigi		if (avg_pkt_size == 0)
1187187769Sluigi			errx(EX_DATAERR,
1188187769Sluigi			    "net.inet.ip.dummynet.red_avg_pkt_size must"
1189187769Sluigi			    " be greater than zero");
1190187769Sluigi
1191187769Sluigi		/*
1192187769Sluigi		 * Ticks needed for sending a medium-sized packet.
1193187769Sluigi		 * Unfortunately, when we are configuring a WF2Q+ queue, we
1194187769Sluigi		 * do not have bandwidth information, because that is stored
1195187769Sluigi		 * in the parent pipe, and also we have multiple queues
1196187769Sluigi		 * competing for it. So we set s=0, which is not very
1197187769Sluigi		 * correct. But on the other hand, why do we want RED with
1198187769Sluigi		 * WF2Q+ ?
1199187769Sluigi		 */
1200204591Sluigi#if 0
1201187769Sluigi		if (p.bandwidth==0) /* this is a WF2Q+ queue */
1202187769Sluigi			s = 0;
1203187769Sluigi		else
1204187769Sluigi			s = (double)ck.hz * avg_pkt_size * 8 / p.bandwidth;
1205204591Sluigi#endif
1206187769Sluigi		/*
1207187769Sluigi		 * max idle time (in ticks) before avg queue size becomes 0.
1208187769Sluigi		 * NOTA:  (3/w_q) is approx the value x so that
1209187769Sluigi		 * (1-w_q)^x < 10^-3.
1210187769Sluigi		 */
1211204591Sluigi		w_q = ((double)fs->w_q) / (1 << SCALE_RED);
1212204591Sluigi#if 0 // go in kernel
1213187769Sluigi		idle = s * 3. / w_q;
1214204591Sluigi		fs->lookup_step = (int)idle / lookup_depth;
1215204591Sluigi		if (!fs->lookup_step)
1216204591Sluigi			fs->lookup_step = 1;
1217187769Sluigi		weight = 1 - w_q;
1218204591Sluigi		for (t = fs->lookup_step; t > 1; --t)
1219187769Sluigi			weight *= 1 - w_q;
1220204591Sluigi		fs->lookup_weight = (int)(weight * (1 << SCALE_RED));
1221204591Sluigi#endif
1222204591Sluigi	    }
1223187769Sluigi	}
1224190865Sluigi
1225204591Sluigi	i = do_cmd(IP_DUMMYNET3, base, (char *)buf - (char *)base);
1226190865Sluigi
1227187769Sluigi	if (i)
1228187769Sluigi		err(1, "setsockopt(%s)", "IP_DUMMYNET_CONFIGURE");
1229187769Sluigi}
1230204591Sluigi
1231204591Sluigivoid
1232204591Sluigidummynet_flush(void)
1233204591Sluigi{
1234204591Sluigi	struct dn_id oid;
1235204591Sluigi	oid_fill(&oid, sizeof(oid), DN_CMD_FLUSH, DN_API_VERSION);
1236204591Sluigi	do_cmd(IP_DUMMYNET3, &oid, oid.len);
1237204591Sluigi}
1238204591Sluigi
1239204591Sluigi/* main entry point for dummynet list functions. co.do_pipe indicates
1240204591Sluigi * which function we want to support.
1241204591Sluigi * XXX todo- accept filtering arguments.
1242204591Sluigi */
1243204591Sluigivoid
1244204591Sluigidummynet_list(int ac, char *av[], int show_counters)
1245204591Sluigi{
1246204591Sluigi	struct dn_id oid, *x;
1247204591Sluigi	int ret, l = sizeof(oid);
1248204591Sluigi
1249204591Sluigi	oid_fill(&oid, l, DN_CMD_GET, DN_API_VERSION);
1250204591Sluigi	switch (co.do_pipe) {
1251204591Sluigi	case 1:
1252204591Sluigi		oid.subtype = DN_LINK;	/* list pipe */
1253204591Sluigi		break;
1254204591Sluigi	case 2:
1255204591Sluigi		oid.subtype = DN_FS;	/* list queue */
1256204591Sluigi		break;
1257204591Sluigi	case 3:
1258204591Sluigi		oid.subtype = DN_SCH;	/* list sched */
1259204591Sluigi		break;
1260204591Sluigi	}
1261204591Sluigi	ret = do_cmd(-IP_DUMMYNET3, &oid, (uintptr_t)&l);
1262204591Sluigi	// printf("%s returns %d need %d\n", __FUNCTION__, ret, oid.id);
1263204591Sluigi	if (ret != 0 || oid.id <= sizeof(oid))
1264204591Sluigi		return;
1265204591Sluigi	l = oid.id;
1266204591Sluigi	x = safe_calloc(1, l);
1267204591Sluigi	*x = oid;
1268204591Sluigi	ret = do_cmd(-IP_DUMMYNET3, x, (uintptr_t)&l);
1269204591Sluigi	// printf("%s returns %d need %d\n", __FUNCTION__, ret, oid.id);
1270204591Sluigi	// XXX filter on ac, av
1271204591Sluigi	list_pipes(x, O_NEXT(x, l));
1272204591Sluigi	free(x);
1273204591Sluigi}
1274