1 /*
2  * tc_core.c		TC core library.
3  *
4  *		This program is free software; you can redistribute it and/or
5  *		modify it under the terms of the GNU General Public License
6  *		as published by the Free Software Foundation; either version
7  *		2 of the License, or (at your option) any later version.
8  *
9  * Authors:	Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
10  *
11  */
12 
13 #include <stdio.h>
14 #include <stdlib.h>
15 #include <stdint.h>
16 #include <unistd.h>
17 #include <syslog.h>
18 #include <fcntl.h>
19 #include <math.h>
20 #include <sys/socket.h>
21 #include <netinet/in.h>
22 #include <arpa/inet.h>
23 #include <string.h>
24 
25 #include "tc_core.h"
26 #include <linux/atm.h>
27 
28 static double tick_in_usec = 1;
29 static double clock_factor = 1;
30 
tc_core_time2big(unsigned int time)31 int tc_core_time2big(unsigned int time)
32 {
33 	__u64 t = time;
34 
35 	t *= tick_in_usec;
36 	return (t >> 32) != 0;
37 }
38 
39 
tc_core_time2tick(unsigned int time)40 unsigned int tc_core_time2tick(unsigned int time)
41 {
42 	return time*tick_in_usec;
43 }
44 
tc_core_tick2time(unsigned int tick)45 unsigned int tc_core_tick2time(unsigned int tick)
46 {
47 	return tick/tick_in_usec;
48 }
49 
tc_core_time2ktime(unsigned int time)50 unsigned int tc_core_time2ktime(unsigned int time)
51 {
52 	return time * clock_factor;
53 }
54 
tc_core_ktime2time(unsigned int ktime)55 unsigned int tc_core_ktime2time(unsigned int ktime)
56 {
57 	return ktime / clock_factor;
58 }
59 
tc_calc_xmittime(__u64 rate,unsigned int size)60 unsigned int tc_calc_xmittime(__u64 rate, unsigned int size)
61 {
62 	return tc_core_time2tick(TIME_UNITS_PER_SEC*((double)size/(double)rate));
63 }
64 
tc_calc_xmitsize(__u64 rate,unsigned int ticks)65 unsigned int tc_calc_xmitsize(__u64 rate, unsigned int ticks)
66 {
67 	return ((double)rate*tc_core_tick2time(ticks))/TIME_UNITS_PER_SEC;
68 }
69 
70 /*
71  * The align to ATM cells is used for determining the (ATM) SAR
72  * alignment overhead at the ATM layer. (SAR = Segmentation And
73  * Reassembly).  This is for example needed when scheduling packet on
74  * an ADSL connection.  Note that the extra ATM-AAL overhead is _not_
75  * included in this calculation. This overhead is added in the kernel
76  * before doing the rate table lookup, as this gives better precision
77  * (as the table will always be aligned for 48 bytes).
78  *  --Hawk, d.7/11-2004. <hawk@diku.dk>
79  */
tc_align_to_atm(unsigned int size)80 static unsigned int tc_align_to_atm(unsigned int size)
81 {
82 	int linksize, cells;
83 
84 	cells = size / ATM_CELL_PAYLOAD;
85 	if ((size % ATM_CELL_PAYLOAD) > 0)
86 		cells++;
87 
88 	linksize = cells * ATM_CELL_SIZE; /* Use full cell size to add ATM tax */
89 	return linksize;
90 }
91 
tc_adjust_size(unsigned int sz,unsigned int mpu,enum link_layer linklayer)92 static unsigned int tc_adjust_size(unsigned int sz, unsigned int mpu, enum link_layer linklayer)
93 {
94 	if (sz < mpu)
95 		sz = mpu;
96 
97 	switch (linklayer) {
98 	case LINKLAYER_ATM:
99 		return tc_align_to_atm(sz);
100 	case LINKLAYER_ETHERNET:
101 	default:
102 		/* No size adjustments on Ethernet */
103 		return sz;
104 	}
105 }
106 
107 /* Notice, the rate table calculated here, have gotten replaced in the
108  * kernel and is no-longer used for lookups.
109  *
110  * This happened in kernel release v3.8 caused by kernel
111  *  - commit 56b765b79 ("htb: improved accuracy at high rates").
112  * This change unfortunately caused breakage of tc overhead and
113  * linklayer parameters.
114  *
115  * Kernel overhead handling got fixed in kernel v3.10 by
116  * - commit 01cb71d2d47 (net_sched: restore "overhead xxx" handling)
117  *
118  * Kernel linklayer handling got fixed in kernel v3.11 by
119  * - commit 8a8e3d84b17 (net_sched: restore "linklayer atm" handling)
120  */
121 
122 /*
123    rtab[pkt_len>>cell_log] = pkt_xmit_time
124  */
125 
tc_calc_rtable(struct tc_ratespec * r,__u32 * rtab,int cell_log,unsigned int mtu,enum link_layer linklayer)126 int tc_calc_rtable(struct tc_ratespec *r, __u32 *rtab,
127 		   int cell_log, unsigned int mtu,
128 		   enum link_layer linklayer)
129 {
130 	int i;
131 	unsigned int sz;
132 	unsigned int bps = r->rate;
133 	unsigned int mpu = r->mpu;
134 
135 	if (mtu == 0)
136 		mtu = 2047;
137 
138 	if (cell_log < 0) {
139 		cell_log = 0;
140 		while ((mtu >> cell_log) > 255)
141 			cell_log++;
142 	}
143 
144 	for (i = 0; i < 256; i++) {
145 		sz = tc_adjust_size((i + 1) << cell_log, mpu, linklayer);
146 		rtab[i] = tc_calc_xmittime(bps, sz);
147 	}
148 
149 	r->cell_align =  -1;
150 	r->cell_log = cell_log;
151 	r->linklayer = (linklayer & TC_LINKLAYER_MASK);
152 	return cell_log;
153 }
154 
155 /*
156    stab[pkt_len>>cell_log] = pkt_xmit_size>>size_log
157  */
158 
tc_calc_size_table(struct tc_sizespec * s,__u16 ** stab)159 int tc_calc_size_table(struct tc_sizespec *s, __u16 **stab)
160 {
161 	int i;
162 	enum link_layer linklayer = s->linklayer;
163 	unsigned int sz;
164 
165 	if (linklayer <= LINKLAYER_ETHERNET && s->mpu == 0) {
166 		/* don't need data table in this case (only overhead set) */
167 		s->mtu = 0;
168 		s->tsize = 0;
169 		s->cell_log = 0;
170 		s->cell_align = 0;
171 		*stab = NULL;
172 		return 0;
173 	}
174 
175 	if (s->mtu == 0)
176 		s->mtu = 2047;
177 	if (s->tsize == 0)
178 		s->tsize = 512;
179 
180 	s->cell_log = 0;
181 	while ((s->mtu >> s->cell_log) > s->tsize - 1)
182 		s->cell_log++;
183 
184 	*stab = malloc(s->tsize * sizeof(__u16));
185 	if (!*stab)
186 		return -1;
187 
188 again:
189 	for (i = s->tsize - 1; i >= 0; i--) {
190 		sz = tc_adjust_size((i + 1) << s->cell_log, s->mpu, linklayer);
191 		if ((sz >> s->size_log) > UINT16_MAX) {
192 			s->size_log++;
193 			goto again;
194 		}
195 		(*stab)[i] = sz >> s->size_log;
196 	}
197 
198 	s->cell_align = -1; /* Due to the sz calc */
199 	return 0;
200 }
201 
tc_core_init(void)202 int tc_core_init(void)
203 {
204 	FILE *fp;
205 	__u32 clock_res;
206 	__u32 t2us;
207 	__u32 us2t;
208 
209 	fp = fopen("/proc/net/psched", "r");
210 	if (fp == NULL)
211 		return -1;
212 
213 	if (fscanf(fp, "%08x%08x%08x", &t2us, &us2t, &clock_res) != 3) {
214 		fclose(fp);
215 		return -1;
216 	}
217 	fclose(fp);
218 
219 	/* compatibility hack: for old iproute binaries (ignoring
220 	 * the kernel clock resolution) the kernel advertises a
221 	 * tick multiplier of 1000 in case of nano-second resolution,
222 	 * which really is 1. */
223 	if (clock_res == 1000000000)
224 		t2us = us2t;
225 
226 	clock_factor  = (double)clock_res / TIME_UNITS_PER_SEC;
227 	tick_in_usec = (double)t2us / us2t * clock_factor;
228 	return 0;
229 }
230