5 include/linux/pkt_sched.h | 518 ++++++++++++++++++++++++++++++++++++++++++++++
9 tc/q_htb.c | 308 +++++++++++++++++++++++++++
10 tc/q_wrr.c | 322 ++++++++++++++++++++++++++++
11 9 files changed, 1177 insertions(+), 5 deletions(-)
13 --- iproute2-2.6.35.orig/doc/ip-cref.tex
14 +++ iproute2-2.6.35/doc/ip-cref.tex
15 @@ -1307,6 +1307,19 @@ peers are allowed to send to us.
16 --- \threeonly the clamp for congestion window. It is ignored if the \verb|lock|
19 +\item \verb|hoplimit NUMBER|
21 +--- [2.5.74+ only] Hop limit on the path to this destination. If it is not
22 + given, Linux uses the value selected with \verb|sysctl| variable
23 + \verb|net/ipv4/ip_default_ttl|.
25 +\item \verb|initcwnd NUMBER|
27 +--- [2.5.70+ only] Initial congestion window size when establishing
28 + connections to this destination. This value is multiplied with the
29 + MSS (``Maximal Segment Size'') for the connection to get the actual
30 + window size. If it is not given (or set to zero), Linux uses the
31 + values specified in~\cite{RFC2414}.
33 \item \verb|advmss NUMBER|
35 @@ -2664,6 +2677,9 @@ http://www.cisco.com/univercd/cc/td/doc/
37 \bibitem{RFC2414} M.~Allman, S.~Floyd, C.~Partridge.
38 ``Increasing TCP's Initial Window'', RFC-2414.
40 +\bibitem{RFC2414} M.~Allman, S.~Floyd, C.~Partridge.
41 +``Increasing TCP's Initial Window'', RFC-2414.
45 --- iproute2-2.6.35.orig/doc/Makefile
46 +++ iproute2-2.6.35/doc/Makefile
47 @@ -14,6 +14,7 @@ PAGESIZE=a4
50 HTMLFILES=$(subst .sgml,.html,$(shell echo *.sgml))
51 +TXTFILES=$(subst .sgml,.txt,$(shell echo *.sgml))
52 DVIFILES=$(subst .ps,.dvi,$(PSFILES))
55 @@ -23,6 +24,8 @@ pstwocol: $(PSFILES)
64 @@ -47,9 +50,12 @@ print: $(PSFILES)
69 + lynx -nolist -dump $< > $@
72 install -m 0644 $(shell echo *.tex) $(DESTDIR)$(DOCDIR)
73 install -m 0644 $(shell echo *.sgml) $(DESTDIR)$(DOCDIR)
76 - rm -f *.aux *.log *.toc $(PSFILES) $(DVIFILES) *.html
77 + rm -f *.aux *.log *.toc $(PSFILES) $(DVIFILES) *.html $(TXTFILES)
78 --- iproute2-2.6.35.orig/include/linux/pkt_sched.h
79 +++ iproute2-2.6.35/include/linux/pkt_sched.h
82 +#ifndef __LINUX_PKT_SCHED_H
83 +#define __LINUX_PKT_SCHED_H
85 +/* Logical priority bands not depending on specific packet scheduler.
86 + Every scheduler will map them to real traffic classes, if it has
87 + no more precise mechanism to classify packets.
89 + These numbers have no special meaning, though their coincidence
90 + with obsolete IPv6 values is not occasional :-). New IPv6 drafts
91 + preferred full anarchy inspired by diffserv group.
93 + Note: TC_PRIO_BESTEFFORT does not mean that it is the most unhappy
94 + class, actually, as rule it will be handled with more care than
95 + filler or even bulk.
98 +#define TC_PRIO_BESTEFFORT 0
99 +#define TC_PRIO_FILLER 1
100 +#define TC_PRIO_BULK 2
101 +#define TC_PRIO_INTERACTIVE_BULK 4
102 +#define TC_PRIO_INTERACTIVE 6
103 +#define TC_PRIO_CONTROL 7
105 +#define TC_PRIO_MAX 15
107 +/* Generic queue statistics, available for all the elements.
108 + Particular schedulers may have also their private records.
113 + __u64 bytes; /* NUmber of enqueues bytes */
114 + __u32 packets; /* Number of enqueued packets */
115 + __u32 drops; /* Packets dropped because of lack of resources */
116 + __u32 overlimits; /* Number of throttle events when this
117 + * flow goes out of allocated bandwidth */
118 + __u32 bps; /* Current flow byte rate */
119 + __u32 pps; /* Current flow packet rate */
130 + unsigned char ewma_log;
136 + All the traffic control objects have 32bit identifiers, or "handles".
138 + They can be considered as opaque numbers from user API viewpoint,
139 + but actually they always consist of two fields: major and
140 + minor numbers, which are interpreted by kernel specially,
141 + that may be used by applications, though not recommended.
143 + F.e. qdisc handles always have minor number equal to zero,
144 + classes (or flows) have major equal to parent qdisc major, and
145 + minor uniquely identifying class inside qdisc.
147 + Macros to manipulate handles:
150 +#define TC_H_MAJ_MASK (0xFFFF0000U)
151 +#define TC_H_MIN_MASK (0x0000FFFFU)
152 +#define TC_H_MAJ(h) ((h)&TC_H_MAJ_MASK)
153 +#define TC_H_MIN(h) ((h)&TC_H_MIN_MASK)
154 +#define TC_H_MAKE(maj,min) (((maj)&TC_H_MAJ_MASK)|((min)&TC_H_MIN_MASK))
156 +#define TC_H_UNSPEC (0U)
157 +#define TC_H_ROOT (0xFFFFFFFFU)
158 +#define TC_H_INGRESS (0xFFFFFFF1U)
162 + unsigned char cell_log;
163 + unsigned char __reserved;
164 + unsigned short feature;
166 + unsigned short mpu;
174 + __u32 limit; /* Queue length: bytes for bfifo, packets for pfifo */
179 +#define TCQ_PRIO_BANDS 16
183 + int bands; /* Number of bands */
184 + __u8 priomap[TC_PRIO_MAX+1]; /* Map: logical priority -> PRIO band */
191 + int flows; /* Maximal number of guaranteed flows */
192 + unsigned char R_log; /* Fixed point position for round number */
193 + unsigned char delta_log; /* Log of maximal managed time interval */
194 + __u8 priomap[TC_PRIO_MAX+1]; /* Map: logical priority -> CSZ band */
199 + struct tc_ratespec slice;
200 + struct tc_ratespec rate;
201 + struct tc_ratespec peakrate;
219 + struct tc_ratespec rate;
220 + struct tc_ratespec peakrate;
237 +/* TEQL does not require any parameters */
243 + unsigned quantum; /* Bytes per round allocated to flow */
244 + int perturb_period; /* Period of hash perturbation */
245 + __u32 limit; /* Maximal packets in queue */
246 + unsigned divisor; /* Hash divisor */
247 + unsigned flows; /* Maximal number of flows */
251 + * NOTE: limit, divisor and flows are hardwired to code at the moment.
253 + * limit=flows=128, divisor=1024;
255 + * The only reason for this is efficiency, it is possible
256 + * to change these parameters in compile time.
270 + __u32 limit; /* HARD maximal queue length (bytes) */
271 + __u32 qth_min; /* Min average length threshold (bytes) */
272 + __u32 qth_max; /* Max average length threshold (bytes) */
273 + unsigned char Wlog; /* log(W) */
274 + unsigned char Plog; /* log(P_max/(qth_max-qth_min)) */
275 + unsigned char Scell_log; /* cell size for idle damping */
276 + unsigned char flags;
277 +#define TC_RED_ECN 1
280 +struct tc_red_xstats
282 + __u32 early; /* Early drops */
283 + __u32 pdrop; /* Drops due to queue limits */
284 + __u32 other; /* Drops due to drop() calls */
285 + __u32 marked; /* Marked packets */
300 +#define TCA_SET_OFF TCA_GRED_PARMS
303 + __u32 limit; /* HARD maximal queue length (bytes)
305 + __u32 qth_min; /* Min average length threshold (bytes)
307 + __u32 qth_max; /* Max average length threshold (bytes)
309 + __u32 DP; /* upto 2^32 DPs */
317 + unsigned char Wlog; /* log(W) */
318 + unsigned char Plog; /* log(P_max/(qth_max-qth_min)) */
319 + unsigned char Scell_log; /* cell size for idle damping */
320 + __u8 prio; /* prio of this VQ */
333 +#define TC_HTB_NUMPRIO 8
334 +#define TC_HTB_MAXDEPTH 8
335 +#define TC_HTB_PROTOVER 3 /* the same as HTB and TC's major */
339 + struct tc_ratespec rate;
340 + struct tc_ratespec ceil;
344 + __u32 level; /* out only */
349 + __u32 version; /* to match HTB/TC */
350 + __u32 rate2quantum; /* bps->quantum divisor */
351 + __u32 defcls; /* default class number */
352 + __u32 debug; /* debug flags */
355 + __u32 direct_pkts; /* count of non shapped packets */
365 +struct tc_htb_xstats
369 + __u32 giants; /* too big packets (rate will not be accurate) */
376 +#define TC_CBQ_MAXPRIO 8
377 +#define TC_CBQ_MAXLEVEL 8
378 +#define TC_CBQ_DEF_EWMA 5
380 +struct tc_cbq_lssopt
382 + unsigned char change;
383 + unsigned char flags;
384 +#define TCF_CBQ_LSS_BOUNDED 1
385 +#define TCF_CBQ_LSS_ISOLATED 2
386 + unsigned char ewma_log;
387 + unsigned char level;
388 +#define TCF_CBQ_LSS_FLAGS 1
389 +#define TCF_CBQ_LSS_EWMA 2
390 +#define TCF_CBQ_LSS_MAXIDLE 4
391 +#define TCF_CBQ_LSS_MINIDLE 8
392 +#define TCF_CBQ_LSS_OFFTIME 0x10
393 +#define TCF_CBQ_LSS_AVPKT 0x20
400 +struct tc_cbq_wrropt
402 + unsigned char flags;
403 + unsigned char priority;
404 + unsigned char cpriority;
405 + unsigned char __reserved;
412 + unsigned char strategy;
413 +#define TC_CBQ_OVL_CLASSIC 0
414 +#define TC_CBQ_OVL_DELAY 1
415 +#define TC_CBQ_OVL_LOWPRIO 2
416 +#define TC_CBQ_OVL_DROP 3
417 +#define TC_CBQ_OVL_RCLASSIC 4
418 + unsigned char priority2;
422 +struct tc_cbq_police
424 + unsigned char police;
425 + unsigned char __res1;
426 + unsigned short __res2;
436 +struct tc_cbq_xstats
450 + TCA_CBQ_OVL_STRATEGY,
456 +#define TCA_CBQ_MAX TCA_CBQ_POLICE
458 +/* dsmark section */
462 + TCA_DSMARK_INDICES,
463 + TCA_DSMARK_DEFAULT_INDEX,
464 + TCA_DSMARK_SET_TC_INDEX,
469 +#define TCA_DSMARK_MAX TCA_DSMARK_VALUE
475 + TCA_ATM_FD, /* file/socket descriptor */
476 + TCA_ATM_PTR, /* pointer to descriptor - later */
477 + TCA_ATM_HDR, /* LL header */
478 + TCA_ATM_EXCESS, /* excess traffic class (0 for CLP) */
479 + TCA_ATM_ADDR, /* PVC address (for output only) */
480 + TCA_ATM_STATE /* VC state (ATM_VS_*; for output only) */
483 +#define TCA_ATM_MAX TCA_ATM_STATE
487 #ifndef __LINUX_PKT_SCHED_H
488 #define __LINUX_PKT_SCHED_H
490 @@ -481,4 +887,116 @@ struct tc_drr_stats {
496 +/* Other includes */
497 +#include <linux/if_ether.h>
499 +// A sub weight and of a class
500 +// All numbers are represented as parts of (2^64-1).
501 +struct tc_wrr_class_weight {
502 + __u64 val; // Current value (0 is not valid)
503 + __u64 decr; // Value pr bytes (2^64-1 is not valid)
504 + __u64 incr; // Value pr seconds (2^64-1 is not valid)
505 + __u64 min; // Minimal value (0 is not valid)
506 + __u64 max; // Minimal value (0 is not valid)
508 +// The time where the above information was correct:
512 +// Packet send when modifying a class:
513 +struct tc_wrr_class_modf {
514 + // Not-valid values are ignored.
515 + struct tc_wrr_class_weight weight1;
516 + struct tc_wrr_class_weight weight2;
519 +// Packet returned when quering a class:
520 +struct tc_wrr_class_stats {
521 + char used; // If this is false the information below is invalid
523 + struct tc_wrr_class_modf class_modf;
525 + unsigned char addr[ETH_ALEN];
526 + char usemac; // True if addr is a MAC address, else it is an IP address
527 + // (this value is only for convience, it is always the same
528 + // value as in the qdisc)
529 + int heappos; // Current heap position or 0 if not in heap
530 + __u64 penal_ls; // Penalty value in heap (ls)
531 + __u64 penal_ms; // Penalty value in heap (ms)
534 +// Qdisc-wide penalty information (boolean values - 2 not valid)
535 +struct tc_wrr_qdisc_weight {
536 + char weight_mode; // 0=No automatic change to weight
537 + // 1=Decrease normally
538 + // 2=Also multiply with number of machines
539 + // 3=Instead multiply with priority divided
540 + // with priority of the other.
544 +// Packet send when modifing a qdisc:
545 +struct tc_wrr_qdisc_modf {
546 + // Not-valid values are ignored:
547 + struct tc_wrr_qdisc_weight weight1;
548 + struct tc_wrr_qdisc_weight weight2;
551 +// Packet send when creating a qdisc:
552 +struct tc_wrr_qdisc_crt {
553 + struct tc_wrr_qdisc_modf qdisc_modf;
555 + char srcaddr; // 1=lookup source, 0=lookup destination
556 + char usemac; // 1=Classify on MAC addresses, 0=classify on IP
557 + char usemasq; // 1=Classify based on masqgrading - only valid
558 + // if usemac is zero
559 + int bands_max; // Maximal number of bands (i.e.: classes)
560 + int proxy_maxconn;// If differnt from 0 then we support proxy remapping
561 + // of packets. And this is the number of maximal
562 + // concurrent proxy connections.
565 +// Packet returned when quering a qdisc:
566 +struct tc_wrr_qdisc_stats {
567 + struct tc_wrr_qdisc_crt qdisc_crt;
569 + int nodes_in_heap; // Current number of bands wanting to send something
570 + int bands_cur; // Current number of bands used (i.e.: MAC/IP addresses seen)
571 + int bands_reused; // Number of times this band has been reused.
572 + int packets_requed; // Number of times packets have been requeued.
573 + __u64 priosum; // Sum of priorities in heap where 1 is 2^32
576 +struct tc_wrr_qdisc_modf_std {
577 + // This indicates which of the tc_wrr_qdisc_modf structers this is:
578 + char proxy; // 0=This struct
580 + // Should we also change a class?
583 + // Only valid if change_class is false
584 + struct tc_wrr_qdisc_modf qdisc_modf;
586 + // Only valid if change_class is true:
587 + unsigned char addr[ETH_ALEN]; // Class to change (non-used bytes should be 0)
588 + struct tc_wrr_class_modf class_modf; // The change
591 +// Used for proxyrempping:
592 +struct tc_wrr_qdisc_modf_proxy {
593 + // This indicates which of the tc_wrr_qdisc_modf structers this is:
594 + char proxy; // 1=This struct
596 + // This is 1 if the proxyremap information should be reset
599 + // changec is the number of elements in changes.
602 + // This is an array of type ProxyRemapBlock:
607 --- iproute2-2.6.35.orig/ip/iptunnel.c
608 +++ iproute2-2.6.35/ip/iptunnel.c
609 @@ -130,7 +130,7 @@ static int parse_args(int argc, char **a
611 p->o_flags |= GRE_KEY;
612 if (strchr(*argv, '.'))
613 - p->o_key = get_addr32(*argv);
614 + p->i_key = get_addr32(*argv);
616 if (get_unsigned(&uval, *argv, 0)<0) {
617 fprintf(stderr, "invalid value of \"okey\"\n");
618 --- iproute2-2.6.35.orig/Makefile
619 +++ iproute2-2.6.35/Makefile
620 @@ -57,7 +57,7 @@ install: all
621 $(DESTDIR)$(DOCDIR)/examples
622 install -m 0644 $(shell find examples/diffserv -maxdepth 1 -type f) \
623 $(DESTDIR)$(DOCDIR)/examples/diffserv
624 - @for i in $(SUBDIRS) doc; do $(MAKE) -C $$i install; done
625 + @set -e; for i in $(SUBDIRS) doc; do $(MAKE) -C $$i install; done
626 install -m 0644 $(shell find etc/iproute2 -maxdepth 1 -type f) $(DESTDIR)$(CONFDIR)
627 install -m 0755 -d $(DESTDIR)$(MANDIR)/man8
628 install -m 0644 $(shell find man/man8 -maxdepth 1 -type f) $(DESTDIR)$(MANDIR)/man8
629 @@ -75,7 +75,7 @@ snapshot:
633 - @for i in $(SUBDIRS) doc; \
634 + @set -e; for i in $(SUBDIRS) doc; \
635 do $(MAKE) $(MFLAGS) -C $$i clean; done
638 --- iproute2-2.6.35.orig/misc/Makefile
639 +++ iproute2-2.6.35/misc/Makefile
641 SSOBJ=ss.o ssfilter.o
642 LNSTATOBJ=lnstat.o lnstat_util.o
644 -TARGETS=ss nstat ifstat rtacct arpd lnstat
645 +#TARGETS=ss nstat ifstat rtacct arpd lnstat
646 +TARGETS=ss nstat rtacct lnstat
650 --- iproute2-2.6.35.orig/tc/Makefile
651 +++ iproute2-2.6.35/tc/Makefile
652 @@ -15,6 +15,7 @@ TCMODULES += q_cbq.o
654 TCMODULES += q_multiq.o
655 TCMODULES += q_netem.o
656 +TCMODULES += q_wrr.o
657 TCMODULES += f_rsvp.o
659 TCMODULES += f_route.o
660 --- iproute2-2.6.35.orig/tc/q_htb.c
661 +++ iproute2-2.6.35/tc/q_htb.c
667 + * This program is free software; you can redistribute it and/or
668 + * modify it under the terms of the GNU General Public License
669 + * as published by the Free Software Foundation; either version
670 + * 2 of the License, or (at your option) any later version.
672 + * Authors: Martin Devera, devik@cdi.cz
681 +#include <sys/socket.h>
682 +#include <netinet/in.h>
683 +#include <arpa/inet.h>
687 +#include "tc_util.h"
689 +#define HTB_TC_VER 0x30003
690 +#if HTB_TC_VER >> 16 != TC_HTB_PROTOVER
691 +#error "Different kernel and TC HTB versions"
694 +static void explain(void)
696 + fprintf(stderr, "Usage: ... qdisc add ... htb [default N] [r2q N]\n"
697 + " default minor id of class to which unclassified packets are sent {0}\n"
698 + " r2q DRR quantums are computed as rate in Bps/r2q {10}\n"
699 + " debug string of 16 numbers each 0-3 {0}\n\n"
700 + "... class add ... htb rate R1 burst B1 [prio P] [slot S] [pslot PS]\n"
701 + " [ceil R2] [cburst B2] [mtu MTU] [quantum Q]\n"
702 + " rate rate allocated to this class (class can still borrow)\n"
703 + " burst max bytes burst which can be accumulated during idle period {computed}\n"
704 + " ceil definite upper class rate (no borrows) {rate}\n"
705 + " cburst burst but for ceil {computed}\n"
706 + " mtu max packet size we create rate map for {1600}\n"
707 + " prio priority of leaf; lower are served first {0}\n"
708 + " quantum how much bytes to serve from leaf at once {use r2q}\n"
709 + "\nTC HTB version %d.%d\n",HTB_TC_VER>>16,HTB_TC_VER&0xffff
713 +static void explain1(char *arg)
715 + fprintf(stderr, "Illegal \"%s\"\n", arg);
720 +#define usage() return(-1)
722 +static int htb_parse_opt(struct qdisc_util *qu, int argc, char **argv, struct nlmsghdr *n)
724 + struct tc_htb_glob opt;
725 + struct rtattr *tail;
726 + unsigned i; char *p;
727 + memset(&opt,0,sizeof(opt));
728 + opt.rate2quantum = 10;
732 + if (matches(*argv, "r2q") == 0) {
734 + if (get_u32(&opt.rate2quantum, *argv, 10)) {
735 + explain1("r2q"); return -1;
737 + } else if (matches(*argv, "default") == 0) {
739 + if (get_u32(&opt.defcls, *argv, 16)) {
740 + explain1("default"); return -1;
742 + } else if (matches(*argv, "debug") == 0) {
743 + NEXT_ARG(); p = *argv;
744 + for (i=0; i<16; i++,p++) {
745 + if (*p<'0' || *p>'3') break;
746 + opt.debug |= (*p-'0')<<(2*i);
749 + fprintf(stderr, "What is \"%s\"?\n", *argv);
755 + tail = (struct rtattr*)(((void*)n)+NLMSG_ALIGN(n->nlmsg_len));
756 + addattr_l(n, 1024, TCA_OPTIONS, NULL, 0);
757 + addattr_l(n, 2024, TCA_HTB_INIT, &opt, NLMSG_ALIGN(sizeof(opt)));
758 + tail->rta_len = (((void*)n)+NLMSG_ALIGN(n->nlmsg_len)) - (void*)tail;
762 +static int htb_parse_class_opt(struct qdisc_util *qu, int argc, char **argv, struct nlmsghdr *n)
765 + struct tc_htb_opt opt;
766 + __u32 rtab[256],ctab[256];
767 + unsigned buffer=0,cbuffer=0;
768 + int cell_log=-1,ccell_log = -1,mtu;
769 + struct rtattr *tail;
771 + memset(&opt, 0, sizeof(opt)); mtu = 1600; /* eth packet len */
774 + if (matches(*argv, "prio") == 0) {
776 + if (get_u32(&opt.prio, *argv, 10)) {
777 + explain1("prio"); return -1;
780 + } else if (matches(*argv, "mtu") == 0) {
782 + if (get_u32(&mtu, *argv, 10)) {
783 + explain1("mtu"); return -1;
785 + } else if (matches(*argv, "quantum") == 0) {
787 + if (get_u32(&opt.quantum, *argv, 10)) {
788 + explain1("quantum"); return -1;
790 + } else if (matches(*argv, "burst") == 0 ||
791 + strcmp(*argv, "buffer") == 0 ||
792 + strcmp(*argv, "maxburst") == 0) {
794 + if (get_size_and_cell(&buffer, &cell_log, *argv) < 0) {
795 + explain1("buffer");
799 + } else if (matches(*argv, "cburst") == 0 ||
800 + strcmp(*argv, "cbuffer") == 0 ||
801 + strcmp(*argv, "cmaxburst") == 0) {
803 + if (get_size_and_cell(&cbuffer, &ccell_log, *argv) < 0) {
804 + explain1("cbuffer");
808 + } else if (strcmp(*argv, "ceil") == 0) {
810 + if (opt.ceil.rate) {
811 + fprintf(stderr, "Double \"ceil\" spec\n");
814 + if (get_rate(&opt.ceil.rate, *argv)) {
819 + } else if (strcmp(*argv, "rate") == 0) {
821 + if (opt.rate.rate) {
822 + fprintf(stderr, "Double \"rate\" spec\n");
825 + if (get_rate(&opt.rate.rate, *argv)) {
830 + } else if (strcmp(*argv, "help") == 0) {
834 + fprintf(stderr, "What is \"%s\"?\n", *argv);
844 + if (opt.rate.rate == 0) {
845 + fprintf(stderr, "\"rate\" is required.\n");
848 + /* if ceil params are missing, use the same as rate */
849 + if (!opt.ceil.rate) opt.ceil = opt.rate;
851 + /* compute minimal allowed burst from rate; mtu is added here to make
852 + sute that buffer is larger than mtu and to have some safeguard space */
853 + if (!buffer) buffer = opt.rate.rate / HZ + mtu;
854 + if (!cbuffer) cbuffer = opt.ceil.rate / HZ + mtu;
856 + if ((cell_log = tc_calc_rtable(opt.rate.rate, rtab, cell_log, mtu, 0)) < 0) {
857 + fprintf(stderr, "htb: failed to calculate rate table.\n");
860 + opt.buffer = tc_calc_xmittime(opt.rate.rate, buffer);
861 + opt.rate.cell_log = cell_log;
863 + if ((ccell_log = tc_calc_rtable(opt.ceil.rate, ctab, cell_log, mtu, 0)) < 0) {
864 + fprintf(stderr, "htb: failed to calculate ceil rate table.\n");
867 + opt.cbuffer = tc_calc_xmittime(opt.ceil.rate, cbuffer);
868 + opt.ceil.cell_log = ccell_log;
870 + tail = (struct rtattr*)(((void*)n)+NLMSG_ALIGN(n->nlmsg_len));
871 + addattr_l(n, 1024, TCA_OPTIONS, NULL, 0);
872 + addattr_l(n, 2024, TCA_HTB_PARMS, &opt, sizeof(opt));
873 + addattr_l(n, 3024, TCA_HTB_RTAB, rtab, 1024);
874 + addattr_l(n, 4024, TCA_HTB_CTAB, ctab, 1024);
875 + tail->rta_len = (((void*)n)+NLMSG_ALIGN(n->nlmsg_len)) - (void*)tail;
879 +static int htb_print_opt(struct qdisc_util *qu, FILE *f, struct rtattr *opt)
881 + struct rtattr *tb[TCA_HTB_RTAB+1];
882 + struct tc_htb_opt *hopt;
883 + struct tc_htb_glob *gopt;
884 + double buffer,cbuffer;
891 + memset(tb, 0, sizeof(tb));
892 + parse_rtattr(tb, TCA_HTB_RTAB, RTA_DATA(opt), RTA_PAYLOAD(opt));
894 + if (tb[TCA_HTB_PARMS]) {
896 + hopt = RTA_DATA(tb[TCA_HTB_PARMS]);
897 + if (RTA_PAYLOAD(tb[TCA_HTB_PARMS]) < sizeof(*hopt)) return -1;
899 + if (!hopt->level) {
900 + fprintf(f, "prio %d ", (int)hopt->prio);
902 + fprintf(f, "quantum %d ", (int)hopt->quantum);
904 + fprintf(f, "rate %s ", sprint_rate(hopt->rate.rate, b1));
905 + buffer = ((double)hopt->rate.rate*tc_core_tick2usec(hopt->buffer))/1000000;
906 + fprintf(f, "ceil %s ", sprint_rate(hopt->ceil.rate, b1));
907 + cbuffer = ((double)hopt->ceil.rate*tc_core_tick2usec(hopt->cbuffer))/1000000;
908 + if (show_details) {
909 + fprintf(f, "burst %s/%u mpu %s ", sprint_size(buffer, b1),
910 + 1<<hopt->rate.cell_log, sprint_size(hopt->rate.mpu, b2));
911 + fprintf(f, "cburst %s/%u mpu %s ", sprint_size(cbuffer, b1),
912 + 1<<hopt->ceil.cell_log, sprint_size(hopt->ceil.mpu, b2));
913 + fprintf(f, "level %d ", (int)hopt->level);
915 + fprintf(f, "burst %s ", sprint_size(buffer, b1));
916 + fprintf(f, "cburst %s ", sprint_size(cbuffer, b1));
919 + fprintf(f, "buffer [%08x] cbuffer [%08x] ",
920 + hopt->buffer,hopt->cbuffer);
922 + if (tb[TCA_HTB_INIT]) {
923 + gopt = RTA_DATA(tb[TCA_HTB_INIT]);
924 + if (RTA_PAYLOAD(tb[TCA_HTB_INIT]) < sizeof(*gopt)) return -1;
926 + fprintf(f, "r2q %d default %x direct_packets_stat %u",
927 + gopt->rate2quantum,gopt->defcls,gopt->direct_pkts);
929 + fprintf(f," ver %d.%d",gopt->version >> 16,gopt->version & 0xffff);
934 +static int htb_print_xstats(struct qdisc_util *qu, FILE *f, struct rtattr *xstats)
936 + struct tc_htb_xstats *st;
937 + if (xstats == NULL)
940 + if (RTA_PAYLOAD(xstats) < sizeof(*st))
943 + st = RTA_DATA(xstats);
944 + fprintf(f, " lended: %u borrowed: %u giants: %u\n",
945 + st->lends,st->borrows,st->giants);
946 + fprintf(f, " tokens: %d ctokens: %d\n", st->tokens,st->ctokens);
950 +struct qdisc_util htb_util = {
956 + htb_parse_class_opt,
960 +/* for testing of old one */
961 +struct qdisc_util htb2_util = {
967 + htb_parse_class_opt,
975 +++ iproute2-2.6.35/tc/q_wrr.c
982 +#include <sys/socket.h>
983 +#include <netinet/in.h>
984 +#include <arpa/inet.h>
989 +#include "tc_util.h"
991 +#define usage() return(-1)
993 +// Returns -1 on error
994 +static int wrr_parse_qdisc_weight(int argc, char** argv,
995 + struct tc_wrr_qdisc_modf* opt) {
998 + opt->weight1.weight_mode=-1;
999 + opt->weight2.weight_mode=-1;
1001 + for(i=0; i<argc; i++) {
1002 + if(!memcmp(argv[i],"wmode1=",7)) {
1003 + opt->weight1.weight_mode=atoi(argv[i]+7);
1004 + } else if(!memcmp(argv[i],"wmode2=",7)) {
1005 + opt->weight2.weight_mode=atoi(argv[i]+7);
1007 + printf("Usage: ... [wmode1=0|1|2|3] [wmode2=0|1|2|3]\n");
1014 +static int wrr_parse_class_modf(int argc, char** argv,
1015 + struct tc_wrr_class_modf* modf) {
1019 + fprintf(stderr, "Usage: ... [weight1=val] [decr1=val] [incr1=val] [min1=val] [max1=val] [val2=val] ...\n");
1020 + fprintf(stderr, " The values can be floating point like 0.42 or divisions like 42/100\n");
1024 + // Set meaningless values:
1025 + modf->weight1.val=0;
1026 + modf->weight1.decr=(__u64)-1;
1027 + modf->weight1.incr=(__u64)-1;
1028 + modf->weight1.min=0;
1029 + modf->weight1.max=0;
1030 + modf->weight2.val=0;
1031 + modf->weight2.decr=(__u64)-1;
1032 + modf->weight2.incr=(__u64)-1;
1033 + modf->weight2.min=0;
1034 + modf->weight2.max=0;
1036 + // And read values:
1037 + for(i=0; i<argc; i++) {
1039 + char* name,*value1=0,*value2=0;
1040 + long double f_val1,f_val2=1,value;
1041 + if(strlen(argv[i])>=sizeof(arg)) {
1042 + fprintf(stderr,"Argument too long: %s\n",argv[i]);
1045 + strcpy(arg,argv[i]);
1047 + name=strtok(arg,"=");
1048 + if(name) value1=strtok(0,"/");
1049 + if(value1) value2=strtok(0,"");
1052 + fprintf(stderr,"No = found in argument: %s\n",argv[i]);
1056 + f_val1=atof(value1);
1057 + if(value2) f_val2=atof(value2);
1060 + fprintf(stderr,"Division by 0\n");
1064 + value=f_val1/f_val2;
1065 + if(value>1) value=1;
1066 + if(value<0) value=0;
1067 + value*=((__u64)-1);
1069 + // And find the value set
1070 + if(!strcmp(name,"weight1")) modf->weight1.val=value;
1071 + else if(!strcmp(name,"decr1")) modf->weight1.decr=value;
1072 + else if(!strcmp(name,"incr1")) modf->weight1.incr=value;
1073 + else if(!strcmp(name,"min1")) modf->weight1.min=value;
1074 + else if(!strcmp(name,"max1")) modf->weight1.max=value;
1075 + else if(!strcmp(name,"weight2")) modf->weight2.val=value;
1076 + else if(!strcmp(name,"decr2")) modf->weight2.decr=value;
1077 + else if(!strcmp(name,"incr2")) modf->weight2.incr=value;
1078 + else if(!strcmp(name,"min2")) modf->weight2.min=value;
1079 + else if(!strcmp(name,"max2")) modf->weight2.max=value;
1081 + fprintf(stderr,"illegal value: %s\n",name);
1089 +static int wrr_parse_opt(struct qdisc_util *qu, int argc, char **argv, struct nlmsghdr *n)
1091 + if(n->nlmsg_flags & NLM_F_CREATE) {
1092 + // This is a create request:
1093 + struct tc_wrr_qdisc_crt opt;
1095 + int sour,dest,ip,mac,masq;
1098 + fprintf(stderr, "Usage: ... wrr sour|dest ip|masq|mac maxclasses proxymaxcon [penalty-setup]\n");
1102 + // Read sour/dest:
1103 + memset(&opt,0,sizeof(opt));
1104 + sour=!strcmp(argv[0],"sour");
1105 + dest=!strcmp(argv[0],"dest");
1107 + if(!sour && !dest) {
1108 + fprintf(stderr,"sour or dest must be specified\n");
1113 + ip=!strcmp(argv[1],"ip");
1114 + mac=!strcmp(argv[1],"mac");
1115 + masq=!strcmp(argv[1],"masq");
1117 + if(!ip && !mac && !masq) {
1118 + fprintf(stderr,"ip, masq or mac must be specified\n");
1125 + opt.bands_max=atoi(argv[2]);
1127 + opt.proxy_maxconn=atoi(argv[3]);
1130 + if(wrr_parse_qdisc_weight(argc-4,argv+4,&opt.qdisc_modf)<0) return -1;
1131 + if(opt.qdisc_modf.weight1.weight_mode==-1) opt.qdisc_modf.weight1.weight_mode=0;
1132 + if(opt.qdisc_modf.weight2.weight_mode==-1) opt.qdisc_modf.weight2.weight_mode=0;
1134 + addattr_l(n, 1024, TCA_OPTIONS, &opt, sizeof(opt));
1136 + struct tc_wrr_qdisc_modf_std opt;
1139 + // This is a modify request:
1141 + fprintf(stderr,"... qdisc ... or ... class ...\n");
1145 + qdisc=!strcmp(argv[0],"qdisc");
1146 + class=!strcmp(argv[0],"class");
1148 + if(!qdisc && !class) {
1149 + fprintf(stderr,"qdisc or class must be specified\n");
1159 + opt.change_class=0;
1160 + if(wrr_parse_qdisc_weight(argc, argv, &opt.qdisc_modf)<0) return -1;
1162 + int a0,a1,a2,a3,a4=0,a5=0;
1164 + opt.change_class=1;
1167 + fprintf(stderr,"... <mac>|<ip>|<masq> ...\n");
1170 + memset(opt.addr,0,sizeof(opt.addr));
1172 + if((sscanf(argv[0],"%i.%i.%i.%i",&a0,&a1,&a2,&a3)!=4) &&
1173 + (sscanf(argv[0],"%x:%x:%x:%x:%x:%x",&a0,&a1,&a2,&a3,&a4,&a5)!=6)) {
1174 + fprintf(stderr,"Wrong format of mac or ip address\n");
1178 + opt.addr[0]=a0; opt.addr[1]=a1; opt.addr[2]=a2;
1179 + opt.addr[3]=a3; opt.addr[4]=a4; opt.addr[5]=a5;
1181 + if(wrr_parse_class_modf(argc-1, argv+1, &opt.class_modf)<0) return -1;
1184 + addattr_l(n, 1024, TCA_OPTIONS, &opt, sizeof(opt));
1189 +static int wrr_parse_copt(struct qdisc_util *qu, int argc, char **argv, struct nlmsghdr *n) {
1190 + struct tc_wrr_class_modf opt;
1192 + memset(&opt,0,sizeof(opt));
1193 + if(wrr_parse_class_modf(argc,argv,&opt)<0) return -1;
1195 + addattr_l(n, 1024, TCA_OPTIONS, &opt, sizeof(opt));
1199 +static int wrr_print_opt(struct qdisc_util *qu, FILE *f, struct rtattr *opt)
1201 + struct tc_wrr_qdisc_stats *qopt;
1206 + if (RTA_PAYLOAD(opt) < sizeof(*qopt))
1208 + qopt = RTA_DATA(opt);
1210 + fprintf(f,"\n (%s/%s) (maxclasses %i) (usedclasses %i) (reused classes %i)\n",
1211 + qopt->qdisc_crt.srcaddr ? "sour" : "dest",
1212 + qopt->qdisc_crt.usemac ? "mac" : (qopt->qdisc_crt.usemasq ? "masq" : "ip"),
1213 + qopt->qdisc_crt.bands_max,
1215 + qopt->bands_reused
1218 + if(qopt->qdisc_crt.proxy_maxconn) {
1219 + fprintf(f," (proxy maxcon %i) (proxy curcon %i)\n",
1220 + qopt->qdisc_crt.proxy_maxconn,qopt->proxy_curconn);
1223 + fprintf(f," (waiting classes %i) (packets requeued %i) (priosum: %Lg)\n",
1224 + qopt->nodes_in_heap,
1225 + qopt->packets_requed,
1226 + qopt->priosum/((long double)((__u32)-1))
1229 + fprintf(f," (wmode1 %i) (wmode2 %i) \n",
1230 + qopt->qdisc_crt.qdisc_modf.weight1.weight_mode,
1231 + qopt->qdisc_crt.qdisc_modf.weight2.weight_mode);
1236 +static int wrr_print_copt(struct qdisc_util *qu, FILE *f, struct rtattr *opt) {
1237 + struct tc_wrr_class_stats *copt;
1238 + long double d=(__u64)-1;
1240 + if (opt == NULL) return 0;
1242 + if (RTA_PAYLOAD(opt) < sizeof(*copt))
1244 + copt = RTA_DATA(opt);
1247 + fprintf(f,"(unused)");
1251 + if(copt->usemac) {
1252 + fprintf(f,"\n (address: %.2X:%.2X:%.2X:%.2X:%.2X:%.2X)\n",
1253 + copt->addr[0],copt->addr[1],copt->addr[2],
1254 + copt->addr[3],copt->addr[4],copt->addr[5]);
1256 + fprintf(f,"\n (address: %i.%i.%i.%i)\n",copt->addr[0],copt->addr[1],copt->addr[2],copt->addr[3]);
1259 + fprintf(f," (total weight: %Lg) (current position: %i) (counters: %u %u : %u %u)\n",
1260 + (copt->class_modf.weight1.val/d)*(copt->class_modf.weight2.val/d),
1262 + (unsigned)(copt->penal_ms>>32),
1263 + (unsigned)(copt->penal_ms & 0xffffffffU),
1264 + (unsigned)(copt->penal_ls>>32),
1265 + (unsigned)(copt->penal_ls & 0xffffffffU)
1268 + fprintf(f," Pars 1: (weight %Lg) (decr: %Lg) (incr: %Lg) (min: %Lg) (max: %Lg)\n",
1269 + copt->class_modf.weight1.val/d,
1270 + copt->class_modf.weight1.decr/d,
1271 + copt->class_modf.weight1.incr/d,
1272 + copt->class_modf.weight1.min/d,
1273 + copt->class_modf.weight1.max/d);
1275 + fprintf(f," Pars 2: (weight %Lg) (decr: %Lg) (incr: %Lg) (min: %Lg) (max: %Lg)",
1276 + copt->class_modf.weight2.val/d,
1277 + copt->class_modf.weight2.decr/d,
1278 + copt->class_modf.weight2.incr/d,
1279 + copt->class_modf.weight2.min/d,
1280 + copt->class_modf.weight2.max/d);
1285 +static int wrr_print_xstats(struct qdisc_util *qu, FILE *f, struct rtattr *xstats)
1291 +struct qdisc_util wrr_qdisc_util = {
1293 + .parse_qopt = wrr_parse_opt,
1294 + .print_qopt = wrr_print_opt,
1295 + .print_xstats = wrr_print_xstats,
1296 + .parse_copt = wrr_parse_copt,
1297 + .print_copt = wrr_print_copt