uipc_mbuf.c revision 1.44 1 1.44 itojun /* $NetBSD: uipc_mbuf.c,v 1.44 1999/10/27 14:23:27 itojun Exp $ */
2 1.42 thorpej
3 1.42 thorpej /*-
4 1.42 thorpej * Copyright (c) 1999 The NetBSD Foundation, Inc.
5 1.42 thorpej * All rights reserved.
6 1.42 thorpej *
7 1.42 thorpej * This code is derived from software contributed to The NetBSD Foundation
8 1.42 thorpej * by Jason R. Thorpe of the Numerical Aerospace Simulation Facility,
9 1.42 thorpej * NASA Ames Research Center.
10 1.42 thorpej *
11 1.42 thorpej * Redistribution and use in source and binary forms, with or without
12 1.42 thorpej * modification, are permitted provided that the following conditions
13 1.42 thorpej * are met:
14 1.42 thorpej * 1. Redistributions of source code must retain the above copyright
15 1.42 thorpej * notice, this list of conditions and the following disclaimer.
16 1.42 thorpej * 2. Redistributions in binary form must reproduce the above copyright
17 1.42 thorpej * notice, this list of conditions and the following disclaimer in the
18 1.42 thorpej * documentation and/or other materials provided with the distribution.
19 1.42 thorpej * 3. All advertising materials mentioning features or use of this software
20 1.42 thorpej * must display the following acknowledgement:
21 1.42 thorpej * This product includes software developed by the NetBSD
22 1.42 thorpej * Foundation, Inc. and its contributors.
23 1.42 thorpej * 4. Neither the name of The NetBSD Foundation nor the names of its
24 1.42 thorpej * contributors may be used to endorse or promote products derived
25 1.42 thorpej * from this software without specific prior written permission.
26 1.42 thorpej *
27 1.42 thorpej * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
28 1.42 thorpej * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
29 1.42 thorpej * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
30 1.42 thorpej * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
31 1.42 thorpej * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
32 1.42 thorpej * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
33 1.42 thorpej * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
34 1.42 thorpej * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
35 1.42 thorpej * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
36 1.42 thorpej * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
37 1.42 thorpej * POSSIBILITY OF SUCH DAMAGE.
38 1.42 thorpej */
39 1.10 cgd
40 1.1 cgd /*
41 1.9 mycroft * Copyright (c) 1982, 1986, 1988, 1991, 1993
42 1.9 mycroft * The Regents of the University of California. All rights reserved.
43 1.1 cgd *
44 1.1 cgd * Redistribution and use in source and binary forms, with or without
45 1.1 cgd * modification, are permitted provided that the following conditions
46 1.1 cgd * are met:
47 1.1 cgd * 1. Redistributions of source code must retain the above copyright
48 1.1 cgd * notice, this list of conditions and the following disclaimer.
49 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
50 1.1 cgd * notice, this list of conditions and the following disclaimer in the
51 1.1 cgd * documentation and/or other materials provided with the distribution.
52 1.1 cgd * 3. All advertising materials mentioning features or use of this software
53 1.1 cgd * must display the following acknowledgement:
54 1.1 cgd * This product includes software developed by the University of
55 1.1 cgd * California, Berkeley and its contributors.
56 1.1 cgd * 4. Neither the name of the University nor the names of its contributors
57 1.1 cgd * may be used to endorse or promote products derived from this software
58 1.1 cgd * without specific prior written permission.
59 1.1 cgd *
60 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
61 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
62 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
63 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
64 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
65 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
66 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
67 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
68 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
69 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
70 1.1 cgd * SUCH DAMAGE.
71 1.1 cgd *
72 1.26 fvdl * @(#)uipc_mbuf.c 8.4 (Berkeley) 2/14/95
73 1.1 cgd */
74 1.24 mrg
75 1.6 mycroft #include <sys/param.h>
76 1.6 mycroft #include <sys/systm.h>
77 1.6 mycroft #include <sys/proc.h>
78 1.6 mycroft #include <sys/malloc.h>
79 1.9 mycroft #include <sys/map.h>
80 1.1 cgd #define MBTYPES
81 1.6 mycroft #include <sys/mbuf.h>
82 1.6 mycroft #include <sys/kernel.h>
83 1.6 mycroft #include <sys/syslog.h>
84 1.6 mycroft #include <sys/domain.h>
85 1.6 mycroft #include <sys/protosw.h>
86 1.28 thorpej #include <sys/pool.h>
87 1.27 matt #include <sys/socket.h>
88 1.27 matt #include <net/if.h>
89 1.6 mycroft
90 1.6 mycroft #include <vm/vm.h>
91 1.42 thorpej #include <vm/vm_kern.h>
92 1.14 christos
93 1.23 mrg #include <uvm/uvm_extern.h>
94 1.23 mrg
95 1.42 thorpej #include <sys/sysctl.h>
96 1.42 thorpej
97 1.28 thorpej struct pool mbpool; /* mbuf pool */
98 1.28 thorpej struct pool mclpool; /* mbuf cluster pool */
99 1.28 thorpej
100 1.18 thorpej struct mbstat mbstat;
101 1.18 thorpej int max_linkhdr;
102 1.18 thorpej int max_protohdr;
103 1.18 thorpej int max_hdr;
104 1.18 thorpej int max_datalen;
105 1.18 thorpej
106 1.28 thorpej void *mclpool_alloc __P((unsigned long, int, int));
107 1.28 thorpej void mclpool_release __P((void *, unsigned long, int));
108 1.44 itojun static struct mbuf *m_copym0 __P((struct mbuf *, int, int, int, int));
109 1.28 thorpej
110 1.42 thorpej const char *mclpool_warnmsg =
111 1.42 thorpej "WARNING: mclpool limit reached; increase NMBCLUSTERS";
112 1.42 thorpej
113 1.28 thorpej /*
114 1.40 thorpej * Initialize the mbuf allcator.
115 1.28 thorpej */
116 1.4 jtc void
117 1.1 cgd mbinit()
118 1.1 cgd {
119 1.1 cgd
120 1.42 thorpej pool_init(&mbpool, msize, 0, 0, 0, "mbpl", 0, NULL, NULL, 0);
121 1.42 thorpej pool_init(&mclpool, mclbytes, 0, 0, 0, "mclpl", 0, mclpool_alloc,
122 1.28 thorpej mclpool_release, 0);
123 1.37 thorpej
124 1.37 thorpej /*
125 1.39 thorpej * Set the hard limit on the mclpool to the number of
126 1.39 thorpej * mbuf clusters the kernel is to support. Log the limit
127 1.39 thorpej * reached message max once a minute.
128 1.39 thorpej */
129 1.42 thorpej pool_sethardlimit(&mclpool, nmbclusters, mclpool_warnmsg, 60);
130 1.42 thorpej
131 1.39 thorpej /*
132 1.42 thorpej * Set a low water mark for both mbufs and clusters. This should
133 1.42 thorpej * help ensure that they can be allocated in a memory starvation
134 1.42 thorpej * situation. This is important for e.g. diskless systems which
135 1.42 thorpej * must allocate mbufs in order for the pagedaemon to clean pages.
136 1.37 thorpej */
137 1.42 thorpej pool_setlowat(&mbpool, mblowat);
138 1.42 thorpej pool_setlowat(&mclpool, mcllowat);
139 1.42 thorpej }
140 1.42 thorpej
141 1.42 thorpej int
142 1.42 thorpej sysctl_dombuf(name, namelen, oldp, oldlenp, newp, newlen)
143 1.42 thorpej int *name;
144 1.42 thorpej u_int namelen;
145 1.42 thorpej void *oldp;
146 1.42 thorpej size_t *oldlenp;
147 1.42 thorpej void *newp;
148 1.42 thorpej size_t newlen;
149 1.42 thorpej {
150 1.42 thorpej int error, newval;
151 1.42 thorpej
152 1.42 thorpej /* All sysctl names at this level are terminal. */
153 1.42 thorpej if (namelen != 1)
154 1.42 thorpej return (ENOTDIR); /* overloaded */
155 1.42 thorpej
156 1.42 thorpej switch (name[0]) {
157 1.42 thorpej case MBUF_MSIZE:
158 1.42 thorpej return (sysctl_rdint(oldp, oldlenp, newp, msize));
159 1.42 thorpej case MBUF_MCLBYTES:
160 1.42 thorpej return (sysctl_rdint(oldp, oldlenp, newp, mclbytes));
161 1.42 thorpej case MBUF_NMBCLUSTERS:
162 1.42 thorpej /*
163 1.42 thorpej * If we have direct-mapped pool pages, we can adjust this
164 1.42 thorpej * number on the fly. If not, we're limited by the size
165 1.42 thorpej * of mb_map, and cannot change this value.
166 1.42 thorpej *
167 1.42 thorpej * Note: we only allow the value to be increased, never
168 1.42 thorpej * decreased.
169 1.42 thorpej */
170 1.42 thorpej if (mb_map == NULL) {
171 1.42 thorpej newval = nmbclusters;
172 1.42 thorpej error = sysctl_int(oldp, oldlenp, newp, newlen,
173 1.42 thorpej &newval);
174 1.42 thorpej if (error != 0)
175 1.42 thorpej return (error);
176 1.42 thorpej if (newp != NULL) {
177 1.42 thorpej if (newval >= nmbclusters) {
178 1.42 thorpej nmbclusters = newval;
179 1.42 thorpej pool_sethardlimit(&mclpool,
180 1.42 thorpej nmbclusters, mclpool_warnmsg, 60);
181 1.42 thorpej } else
182 1.42 thorpej error = EINVAL;
183 1.42 thorpej }
184 1.42 thorpej return (error);
185 1.42 thorpej } else
186 1.42 thorpej return (sysctl_rdint(oldp, oldlenp, newp, nmbclusters));
187 1.42 thorpej case MBUF_MBLOWAT:
188 1.42 thorpej case MBUF_MCLLOWAT:
189 1.42 thorpej /* New value must be >= 0. */
190 1.42 thorpej newval = (name[0] == MBUF_MBLOWAT) ? mblowat : mcllowat;
191 1.42 thorpej error = sysctl_int(oldp, oldlenp, newp, newlen, &newval);
192 1.42 thorpej if (error != 0)
193 1.42 thorpej return (error);
194 1.42 thorpej if (newp != NULL) {
195 1.42 thorpej if (newval >= 0) {
196 1.42 thorpej if (name[0] == MBUF_MBLOWAT) {
197 1.42 thorpej mblowat = newval;
198 1.42 thorpej pool_setlowat(&mbpool, newval);
199 1.42 thorpej } else {
200 1.42 thorpej mcllowat = newval;
201 1.42 thorpej pool_setlowat(&mclpool, newval);
202 1.42 thorpej }
203 1.42 thorpej } else
204 1.42 thorpej error = EINVAL;
205 1.42 thorpej }
206 1.42 thorpej return (error);
207 1.42 thorpej default:
208 1.42 thorpej return (EOPNOTSUPP);
209 1.42 thorpej }
210 1.42 thorpej /* NOTREACHED */
211 1.28 thorpej }
212 1.28 thorpej
213 1.28 thorpej void *
214 1.28 thorpej mclpool_alloc(sz, flags, mtype)
215 1.28 thorpej unsigned long sz;
216 1.28 thorpej int flags;
217 1.28 thorpej int mtype;
218 1.28 thorpej {
219 1.32 thorpej boolean_t waitok = (flags & PR_WAITOK) ? TRUE : FALSE;
220 1.28 thorpej
221 1.39 thorpej return ((void *)uvm_km_alloc_poolpage1(mb_map, uvmexp.mb_object,
222 1.39 thorpej waitok));
223 1.1 cgd }
224 1.1 cgd
225 1.28 thorpej void
226 1.28 thorpej mclpool_release(v, sz, mtype)
227 1.28 thorpej void *v;
228 1.28 thorpej unsigned long sz;
229 1.28 thorpej int mtype;
230 1.1 cgd {
231 1.1 cgd
232 1.31 thorpej uvm_km_free_poolpage1(mb_map, (vaddr_t)v);
233 1.1 cgd }
234 1.1 cgd
235 1.1 cgd /*
236 1.1 cgd * When MGET failes, ask protocols to free space when short of memory,
237 1.1 cgd * then re-attempt to allocate an mbuf.
238 1.1 cgd */
239 1.1 cgd struct mbuf *
240 1.1 cgd m_retry(i, t)
241 1.1 cgd int i, t;
242 1.1 cgd {
243 1.27 matt struct mbuf *m;
244 1.1 cgd
245 1.29 thorpej m_reclaim(i);
246 1.1 cgd #define m_retry(i, t) (struct mbuf *)0
247 1.1 cgd MGET(m, i, t);
248 1.1 cgd #undef m_retry
249 1.18 thorpej if (m != NULL)
250 1.18 thorpej mbstat.m_wait++;
251 1.18 thorpej else
252 1.18 thorpej mbstat.m_drops++;
253 1.1 cgd return (m);
254 1.1 cgd }
255 1.1 cgd
256 1.1 cgd /*
257 1.1 cgd * As above; retry an MGETHDR.
258 1.1 cgd */
259 1.1 cgd struct mbuf *
260 1.1 cgd m_retryhdr(i, t)
261 1.1 cgd int i, t;
262 1.1 cgd {
263 1.27 matt struct mbuf *m;
264 1.1 cgd
265 1.29 thorpej m_reclaim(i);
266 1.1 cgd #define m_retryhdr(i, t) (struct mbuf *)0
267 1.1 cgd MGETHDR(m, i, t);
268 1.1 cgd #undef m_retryhdr
269 1.18 thorpej if (m != NULL)
270 1.18 thorpej mbstat.m_wait++;
271 1.18 thorpej else
272 1.18 thorpej mbstat.m_drops++;
273 1.1 cgd return (m);
274 1.1 cgd }
275 1.1 cgd
276 1.14 christos void
277 1.29 thorpej m_reclaim(how)
278 1.29 thorpej int how;
279 1.1 cgd {
280 1.27 matt struct domain *dp;
281 1.27 matt struct protosw *pr;
282 1.27 matt struct ifnet *ifp;
283 1.1 cgd int s = splimp();
284 1.1 cgd
285 1.33 thorpej for (dp = domains; dp; dp = dp->dom_next)
286 1.33 thorpej for (pr = dp->dom_protosw;
287 1.33 thorpej pr < dp->dom_protoswNPROTOSW; pr++)
288 1.33 thorpej if (pr->pr_drain)
289 1.33 thorpej (*pr->pr_drain)();
290 1.27 matt for (ifp = TAILQ_FIRST(&ifnet); ifp; ifp = TAILQ_NEXT(ifp, if_list))
291 1.27 matt if (ifp->if_drain)
292 1.27 matt (*ifp->if_drain)(ifp);
293 1.1 cgd splx(s);
294 1.1 cgd mbstat.m_drain++;
295 1.1 cgd }
296 1.1 cgd
/*
 * Space allocation routines.
 * These are also available as macros
 * for critical paths.
 */

/*
 * Function form of MGET: returns whatever MGET leaves in its first
 * argument.
 */
struct mbuf *
m_get(nowait, type)
	int nowait, type;
{
	struct mbuf *mb;

	MGET(mb, nowait, type);
	return (mb);
}
311 1.1 cgd
/*
 * Function form of MGETHDR: returns whatever MGETHDR leaves in its
 * first argument.
 */
struct mbuf *
m_gethdr(nowait, type)
	int nowait, type;
{
	struct mbuf *mb;

	MGETHDR(mb, nowait, type);
	return (mb);
}
321 1.1 cgd
322 1.1 cgd struct mbuf *
323 1.5 cgd m_getclr(nowait, type)
324 1.5 cgd int nowait, type;
325 1.1 cgd {
326 1.27 matt struct mbuf *m;
327 1.1 cgd
328 1.5 cgd MGET(m, nowait, type);
329 1.1 cgd if (m == 0)
330 1.1 cgd return (0);
331 1.30 perry memset(mtod(m, caddr_t), 0, MLEN);
332 1.1 cgd return (m);
333 1.1 cgd }
334 1.1 cgd
/*
 * Function form of MFREE: release the single mbuf "m" and return the
 * value MFREE stores in its second argument.
 */
struct mbuf *
m_free(m)
	struct mbuf *m;
{
	struct mbuf *next;

	MFREE(m, next);
	return (next);
}
344 1.1 cgd
/*
 * Free an entire mbuf chain, one MFREE at a time.  A null chain is
 * accepted and ignored.
 */
void
m_freem(m)
	struct mbuf *m;
{
	struct mbuf *next;

	while (m != NULL) {
		MFREE(m, next);
		m = next;
	}
}
358 1.1 cgd
359 1.1 cgd /*
360 1.1 cgd * Mbuffer utility routines.
361 1.1 cgd */
362 1.1 cgd
363 1.1 cgd /*
364 1.1 cgd * Lesser-used path for M_PREPEND:
365 1.1 cgd * allocate new mbuf to prepend to chain,
366 1.1 cgd * copy junk along.
367 1.1 cgd */
368 1.1 cgd struct mbuf *
369 1.9 mycroft m_prepend(m, len, how)
370 1.27 matt struct mbuf *m;
371 1.9 mycroft int len, how;
372 1.1 cgd {
373 1.1 cgd struct mbuf *mn;
374 1.1 cgd
375 1.9 mycroft MGET(mn, how, m->m_type);
376 1.1 cgd if (mn == (struct mbuf *)NULL) {
377 1.1 cgd m_freem(m);
378 1.1 cgd return ((struct mbuf *)NULL);
379 1.1 cgd }
380 1.1 cgd if (m->m_flags & M_PKTHDR) {
381 1.1 cgd M_COPY_PKTHDR(mn, m);
382 1.1 cgd m->m_flags &= ~M_PKTHDR;
383 1.1 cgd }
384 1.1 cgd mn->m_next = m;
385 1.1 cgd m = mn;
386 1.1 cgd if (len < MHLEN)
387 1.1 cgd MH_ALIGN(m, len);
388 1.1 cgd m->m_len = len;
389 1.1 cgd return (m);
390 1.1 cgd }
391 1.1 cgd
/*
 * Make a copy of an mbuf chain starting "off0" bytes from the beginning,
 * continuing for "len" bytes.  If len is M_COPYALL, copy to end of mbuf.
 * The wait parameter is a choice of M_WAIT/M_DONTWAIT from caller.
 *
 * Data held in external storage (M_EXT) is shared with the original
 * rather than duplicated; see m_dup() for a full copy.
 */
int MCFail;		/* count of failed chain copies */

struct mbuf *
m_copym(m, off0, len, wait)
	struct mbuf *m;
	int off0, wait;
	int len;
{

	/* Last argument 0: shallow copy on M_EXT. */
	return (m_copym0(m, off0, len, wait, 0));
}
407 1.44 itojun
/*
 * Like m_copym(), but data held in external storage (M_EXT) is copied
 * into newly allocated storage instead of being shared.
 */
struct mbuf *
m_dup(m, off0, len, wait)
	struct mbuf *m;
	int off0, wait;
	int len;
{

	/* Last argument 1: deep copy. */
	return (m_copym0(m, off0, len, wait, 1));
}
416 1.44 itojun
417 1.44 itojun static struct mbuf *
418 1.44 itojun m_copym0(m, off0, len, wait, deep)
419 1.44 itojun struct mbuf *m;
420 1.44 itojun int off0, wait;
421 1.44 itojun int len;
422 1.44 itojun int deep; /* deep copy */
423 1.44 itojun {
424 1.27 matt struct mbuf *n, **np;
425 1.27 matt int off = off0;
426 1.1 cgd struct mbuf *top;
427 1.1 cgd int copyhdr = 0;
428 1.1 cgd
429 1.1 cgd if (off < 0 || len < 0)
430 1.43 thorpej panic("m_copym: off %d, len %d", off, len);
431 1.1 cgd if (off == 0 && m->m_flags & M_PKTHDR)
432 1.1 cgd copyhdr = 1;
433 1.1 cgd while (off > 0) {
434 1.1 cgd if (m == 0)
435 1.43 thorpej panic("m_copym: m == 0");
436 1.1 cgd if (off < m->m_len)
437 1.1 cgd break;
438 1.1 cgd off -= m->m_len;
439 1.1 cgd m = m->m_next;
440 1.1 cgd }
441 1.1 cgd np = ⊤
442 1.1 cgd top = 0;
443 1.1 cgd while (len > 0) {
444 1.1 cgd if (m == 0) {
445 1.1 cgd if (len != M_COPYALL)
446 1.43 thorpej panic("m_copym: m == 0 and not COPYALL");
447 1.1 cgd break;
448 1.1 cgd }
449 1.1 cgd MGET(n, wait, m->m_type);
450 1.1 cgd *np = n;
451 1.1 cgd if (n == 0)
452 1.1 cgd goto nospace;
453 1.1 cgd if (copyhdr) {
454 1.1 cgd M_COPY_PKTHDR(n, m);
455 1.1 cgd if (len == M_COPYALL)
456 1.1 cgd n->m_pkthdr.len -= off0;
457 1.1 cgd else
458 1.1 cgd n->m_pkthdr.len = len;
459 1.1 cgd copyhdr = 0;
460 1.1 cgd }
461 1.9 mycroft n->m_len = min(len, m->m_len - off);
462 1.1 cgd if (m->m_flags & M_EXT) {
463 1.44 itojun if (!deep) {
464 1.44 itojun n->m_data = m->m_data + off;
465 1.44 itojun n->m_ext = m->m_ext;
466 1.44 itojun MCLADDREFERENCE(m, n);
467 1.44 itojun } else {
468 1.44 itojun MCLGET(n, wait);
469 1.44 itojun memcpy(mtod(n, caddr_t), mtod(m, caddr_t)+off,
470 1.44 itojun (unsigned)n->m_len);
471 1.44 itojun }
472 1.1 cgd } else
473 1.30 perry memcpy(mtod(n, caddr_t), mtod(m, caddr_t)+off,
474 1.1 cgd (unsigned)n->m_len);
475 1.1 cgd if (len != M_COPYALL)
476 1.1 cgd len -= n->m_len;
477 1.1 cgd off = 0;
478 1.1 cgd m = m->m_next;
479 1.1 cgd np = &n->m_next;
480 1.1 cgd }
481 1.1 cgd if (top == 0)
482 1.1 cgd MCFail++;
483 1.1 cgd return (top);
484 1.1 cgd nospace:
485 1.1 cgd m_freem(top);
486 1.1 cgd MCFail++;
487 1.1 cgd return (0);
488 1.1 cgd }
489 1.1 cgd
490 1.1 cgd /*
491 1.18 thorpej * Copy an entire packet, including header (which must be present).
492 1.18 thorpej * An optimization of the common case `m_copym(m, 0, M_COPYALL, how)'.
493 1.18 thorpej */
494 1.18 thorpej struct mbuf *
495 1.18 thorpej m_copypacket(m, how)
496 1.18 thorpej struct mbuf *m;
497 1.18 thorpej int how;
498 1.18 thorpej {
499 1.18 thorpej struct mbuf *top, *n, *o;
500 1.18 thorpej
501 1.18 thorpej MGET(n, how, m->m_type);
502 1.18 thorpej top = n;
503 1.18 thorpej if (!n)
504 1.18 thorpej goto nospace;
505 1.18 thorpej
506 1.18 thorpej M_COPY_PKTHDR(n, m);
507 1.18 thorpej n->m_len = m->m_len;
508 1.18 thorpej if (m->m_flags & M_EXT) {
509 1.18 thorpej n->m_data = m->m_data;
510 1.18 thorpej n->m_ext = m->m_ext;
511 1.18 thorpej MCLADDREFERENCE(m, n);
512 1.18 thorpej } else {
513 1.30 perry memcpy(mtod(n, char *), mtod(m, char *), n->m_len);
514 1.18 thorpej }
515 1.18 thorpej
516 1.18 thorpej m = m->m_next;
517 1.18 thorpej while (m) {
518 1.18 thorpej MGET(o, how, m->m_type);
519 1.18 thorpej if (!o)
520 1.18 thorpej goto nospace;
521 1.18 thorpej
522 1.18 thorpej n->m_next = o;
523 1.18 thorpej n = n->m_next;
524 1.18 thorpej
525 1.18 thorpej n->m_len = m->m_len;
526 1.18 thorpej if (m->m_flags & M_EXT) {
527 1.18 thorpej n->m_data = m->m_data;
528 1.18 thorpej n->m_ext = m->m_ext;
529 1.18 thorpej MCLADDREFERENCE(m, n);
530 1.18 thorpej } else {
531 1.30 perry memcpy(mtod(n, char *), mtod(m, char *), n->m_len);
532 1.18 thorpej }
533 1.18 thorpej
534 1.18 thorpej m = m->m_next;
535 1.18 thorpej }
536 1.18 thorpej return top;
537 1.18 thorpej nospace:
538 1.18 thorpej m_freem(top);
539 1.18 thorpej MCFail++;
540 1.18 thorpej return 0;
541 1.18 thorpej }
542 1.18 thorpej
543 1.18 thorpej /*
544 1.1 cgd * Copy data from an mbuf chain starting "off" bytes from the beginning,
545 1.1 cgd * continuing for "len" bytes, into the indicated buffer.
546 1.1 cgd */
547 1.14 christos void
548 1.1 cgd m_copydata(m, off, len, cp)
549 1.27 matt struct mbuf *m;
550 1.27 matt int off;
551 1.27 matt int len;
552 1.1 cgd caddr_t cp;
553 1.1 cgd {
554 1.27 matt unsigned count;
555 1.1 cgd
556 1.1 cgd if (off < 0 || len < 0)
557 1.1 cgd panic("m_copydata");
558 1.1 cgd while (off > 0) {
559 1.1 cgd if (m == 0)
560 1.1 cgd panic("m_copydata");
561 1.1 cgd if (off < m->m_len)
562 1.1 cgd break;
563 1.1 cgd off -= m->m_len;
564 1.1 cgd m = m->m_next;
565 1.1 cgd }
566 1.1 cgd while (len > 0) {
567 1.1 cgd if (m == 0)
568 1.1 cgd panic("m_copydata");
569 1.9 mycroft count = min(m->m_len - off, len);
570 1.30 perry memcpy(cp, mtod(m, caddr_t) + off, count);
571 1.1 cgd len -= count;
572 1.1 cgd cp += count;
573 1.1 cgd off = 0;
574 1.1 cgd m = m->m_next;
575 1.1 cgd }
576 1.1 cgd }
577 1.1 cgd
578 1.1 cgd /*
579 1.1 cgd * Concatenate mbuf chain n to m.
580 1.1 cgd * Both chains must be of the same type (e.g. MT_DATA).
581 1.1 cgd * Any m_pkthdr is not updated.
582 1.1 cgd */
583 1.14 christos void
584 1.1 cgd m_cat(m, n)
585 1.27 matt struct mbuf *m, *n;
586 1.1 cgd {
587 1.1 cgd while (m->m_next)
588 1.1 cgd m = m->m_next;
589 1.1 cgd while (n) {
590 1.1 cgd if (m->m_flags & M_EXT ||
591 1.1 cgd m->m_data + m->m_len + n->m_len >= &m->m_dat[MLEN]) {
592 1.1 cgd /* just join the two chains */
593 1.1 cgd m->m_next = n;
594 1.1 cgd return;
595 1.1 cgd }
596 1.1 cgd /* splat the data from one into the other */
597 1.30 perry memcpy(mtod(m, caddr_t) + m->m_len, mtod(n, caddr_t),
598 1.1 cgd (u_int)n->m_len);
599 1.1 cgd m->m_len += n->m_len;
600 1.1 cgd n = m_free(n);
601 1.1 cgd }
602 1.1 cgd }
603 1.1 cgd
604 1.11 mycroft void
605 1.1 cgd m_adj(mp, req_len)
606 1.1 cgd struct mbuf *mp;
607 1.8 deraadt int req_len;
608 1.1 cgd {
609 1.27 matt int len = req_len;
610 1.27 matt struct mbuf *m;
611 1.27 matt int count;
612 1.1 cgd
613 1.1 cgd if ((m = mp) == NULL)
614 1.1 cgd return;
615 1.1 cgd if (len >= 0) {
616 1.1 cgd /*
617 1.1 cgd * Trim from head.
618 1.1 cgd */
619 1.1 cgd while (m != NULL && len > 0) {
620 1.1 cgd if (m->m_len <= len) {
621 1.1 cgd len -= m->m_len;
622 1.1 cgd m->m_len = 0;
623 1.1 cgd m = m->m_next;
624 1.1 cgd } else {
625 1.1 cgd m->m_len -= len;
626 1.1 cgd m->m_data += len;
627 1.1 cgd len = 0;
628 1.1 cgd }
629 1.1 cgd }
630 1.1 cgd m = mp;
631 1.1 cgd if (mp->m_flags & M_PKTHDR)
632 1.1 cgd m->m_pkthdr.len -= (req_len - len);
633 1.1 cgd } else {
634 1.1 cgd /*
635 1.1 cgd * Trim from tail. Scan the mbuf chain,
636 1.1 cgd * calculating its length and finding the last mbuf.
637 1.1 cgd * If the adjustment only affects this mbuf, then just
638 1.1 cgd * adjust and return. Otherwise, rescan and truncate
639 1.1 cgd * after the remaining size.
640 1.1 cgd */
641 1.1 cgd len = -len;
642 1.1 cgd count = 0;
643 1.1 cgd for (;;) {
644 1.1 cgd count += m->m_len;
645 1.1 cgd if (m->m_next == (struct mbuf *)0)
646 1.1 cgd break;
647 1.1 cgd m = m->m_next;
648 1.1 cgd }
649 1.1 cgd if (m->m_len >= len) {
650 1.1 cgd m->m_len -= len;
651 1.8 deraadt if (mp->m_flags & M_PKTHDR)
652 1.8 deraadt mp->m_pkthdr.len -= len;
653 1.1 cgd return;
654 1.1 cgd }
655 1.1 cgd count -= len;
656 1.1 cgd if (count < 0)
657 1.1 cgd count = 0;
658 1.1 cgd /*
659 1.1 cgd * Correct length for chain is "count".
660 1.1 cgd * Find the mbuf with last data, adjust its length,
661 1.1 cgd * and toss data from remaining mbufs on chain.
662 1.1 cgd */
663 1.1 cgd m = mp;
664 1.1 cgd if (m->m_flags & M_PKTHDR)
665 1.1 cgd m->m_pkthdr.len = count;
666 1.1 cgd for (; m; m = m->m_next) {
667 1.1 cgd if (m->m_len >= count) {
668 1.1 cgd m->m_len = count;
669 1.1 cgd break;
670 1.1 cgd }
671 1.1 cgd count -= m->m_len;
672 1.1 cgd }
673 1.18 thorpej while (m->m_next)
674 1.18 thorpej (m = m->m_next) ->m_len = 0;
675 1.1 cgd }
676 1.1 cgd }
677 1.1 cgd
678 1.1 cgd /*
679 1.1 cgd * Rearange an mbuf chain so that len bytes are contiguous
680 1.1 cgd * and in the data area of an mbuf (so that mtod and dtom
681 1.1 cgd * will work for a structure of size len). Returns the resulting
682 1.1 cgd * mbuf chain on success, frees it and returns null on failure.
683 1.1 cgd * If there is room, it will add up to max_protohdr-len extra bytes to the
684 1.1 cgd * contiguous region in an attempt to avoid being called next time.
685 1.1 cgd */
686 1.1 cgd int MPFail;
687 1.1 cgd
688 1.1 cgd struct mbuf *
689 1.1 cgd m_pullup(n, len)
690 1.27 matt struct mbuf *n;
691 1.1 cgd int len;
692 1.1 cgd {
693 1.27 matt struct mbuf *m;
694 1.27 matt int count;
695 1.1 cgd int space;
696 1.1 cgd
697 1.1 cgd /*
698 1.1 cgd * If first mbuf has no cluster, and has room for len bytes
699 1.1 cgd * without shifting current data, pullup into it,
700 1.1 cgd * otherwise allocate a new mbuf to prepend to the chain.
701 1.1 cgd */
702 1.1 cgd if ((n->m_flags & M_EXT) == 0 &&
703 1.1 cgd n->m_data + len < &n->m_dat[MLEN] && n->m_next) {
704 1.1 cgd if (n->m_len >= len)
705 1.1 cgd return (n);
706 1.1 cgd m = n;
707 1.1 cgd n = n->m_next;
708 1.1 cgd len -= m->m_len;
709 1.1 cgd } else {
710 1.1 cgd if (len > MHLEN)
711 1.1 cgd goto bad;
712 1.1 cgd MGET(m, M_DONTWAIT, n->m_type);
713 1.1 cgd if (m == 0)
714 1.1 cgd goto bad;
715 1.1 cgd m->m_len = 0;
716 1.1 cgd if (n->m_flags & M_PKTHDR) {
717 1.1 cgd M_COPY_PKTHDR(m, n);
718 1.1 cgd n->m_flags &= ~M_PKTHDR;
719 1.1 cgd }
720 1.1 cgd }
721 1.1 cgd space = &m->m_dat[MLEN] - (m->m_data + m->m_len);
722 1.1 cgd do {
723 1.1 cgd count = min(min(max(len, max_protohdr), space), n->m_len);
724 1.30 perry memcpy(mtod(m, caddr_t) + m->m_len, mtod(n, caddr_t),
725 1.1 cgd (unsigned)count);
726 1.1 cgd len -= count;
727 1.1 cgd m->m_len += count;
728 1.1 cgd n->m_len -= count;
729 1.1 cgd space -= count;
730 1.1 cgd if (n->m_len)
731 1.1 cgd n->m_data += count;
732 1.1 cgd else
733 1.1 cgd n = m_free(n);
734 1.1 cgd } while (len > 0 && n);
735 1.1 cgd if (len > 0) {
736 1.1 cgd (void) m_free(m);
737 1.1 cgd goto bad;
738 1.1 cgd }
739 1.1 cgd m->m_next = n;
740 1.1 cgd return (m);
741 1.1 cgd bad:
742 1.1 cgd m_freem(n);
743 1.1 cgd MPFail++;
744 1.1 cgd return (0);
745 1.9 mycroft }
746 1.9 mycroft
747 1.9 mycroft /*
748 1.9 mycroft * Partition an mbuf chain in two pieces, returning the tail --
749 1.9 mycroft * all but the first len0 bytes. In case of failure, it returns NULL and
750 1.9 mycroft * attempts to restore the chain to its original state.
751 1.9 mycroft */
752 1.9 mycroft struct mbuf *
753 1.9 mycroft m_split(m0, len0, wait)
754 1.27 matt struct mbuf *m0;
755 1.9 mycroft int len0, wait;
756 1.9 mycroft {
757 1.27 matt struct mbuf *m, *n;
758 1.22 thorpej unsigned len = len0, remain, len_save;
759 1.9 mycroft
760 1.9 mycroft for (m = m0; m && len > m->m_len; m = m->m_next)
761 1.9 mycroft len -= m->m_len;
762 1.9 mycroft if (m == 0)
763 1.9 mycroft return (0);
764 1.9 mycroft remain = m->m_len - len;
765 1.9 mycroft if (m0->m_flags & M_PKTHDR) {
766 1.9 mycroft MGETHDR(n, wait, m0->m_type);
767 1.9 mycroft if (n == 0)
768 1.9 mycroft return (0);
769 1.9 mycroft n->m_pkthdr.rcvif = m0->m_pkthdr.rcvif;
770 1.9 mycroft n->m_pkthdr.len = m0->m_pkthdr.len - len0;
771 1.22 thorpej len_save = m0->m_pkthdr.len;
772 1.9 mycroft m0->m_pkthdr.len = len0;
773 1.9 mycroft if (m->m_flags & M_EXT)
774 1.9 mycroft goto extpacket;
775 1.9 mycroft if (remain > MHLEN) {
776 1.9 mycroft /* m can't be the lead packet */
777 1.9 mycroft MH_ALIGN(n, 0);
778 1.9 mycroft n->m_next = m_split(m, len, wait);
779 1.9 mycroft if (n->m_next == 0) {
780 1.9 mycroft (void) m_free(n);
781 1.22 thorpej m0->m_pkthdr.len = len_save;
782 1.9 mycroft return (0);
783 1.9 mycroft } else
784 1.9 mycroft return (n);
785 1.9 mycroft } else
786 1.9 mycroft MH_ALIGN(n, remain);
787 1.9 mycroft } else if (remain == 0) {
788 1.9 mycroft n = m->m_next;
789 1.9 mycroft m->m_next = 0;
790 1.9 mycroft return (n);
791 1.9 mycroft } else {
792 1.9 mycroft MGET(n, wait, m->m_type);
793 1.9 mycroft if (n == 0)
794 1.9 mycroft return (0);
795 1.9 mycroft M_ALIGN(n, remain);
796 1.9 mycroft }
797 1.9 mycroft extpacket:
798 1.9 mycroft if (m->m_flags & M_EXT) {
799 1.9 mycroft n->m_ext = m->m_ext;
800 1.18 thorpej MCLADDREFERENCE(m, n);
801 1.9 mycroft n->m_data = m->m_data + len;
802 1.9 mycroft } else {
803 1.30 perry memcpy(mtod(n, caddr_t), mtod(m, caddr_t) + len, remain);
804 1.9 mycroft }
805 1.9 mycroft n->m_len = remain;
806 1.9 mycroft m->m_len = len;
807 1.9 mycroft n->m_next = m->m_next;
808 1.9 mycroft m->m_next = 0;
809 1.9 mycroft return (n);
810 1.9 mycroft }
811 1.9 mycroft /*
812 1.9 mycroft * Routine to copy from device local memory into mbufs.
813 1.9 mycroft */
814 1.9 mycroft struct mbuf *
815 1.9 mycroft m_devget(buf, totlen, off0, ifp, copy)
816 1.9 mycroft char *buf;
817 1.9 mycroft int totlen, off0;
818 1.9 mycroft struct ifnet *ifp;
819 1.18 thorpej void (*copy) __P((const void *from, void *to, size_t len));
820 1.9 mycroft {
821 1.27 matt struct mbuf *m;
822 1.9 mycroft struct mbuf *top = 0, **mp = ⊤
823 1.27 matt int off = off0, len;
824 1.27 matt char *cp;
825 1.9 mycroft char *epkt;
826 1.9 mycroft
827 1.9 mycroft cp = buf;
828 1.9 mycroft epkt = cp + totlen;
829 1.9 mycroft if (off) {
830 1.13 cgd /*
831 1.13 cgd * If 'off' is non-zero, packet is trailer-encapsulated,
832 1.13 cgd * so we have to skip the type and length fields.
833 1.13 cgd */
834 1.13 cgd cp += off + 2 * sizeof(u_int16_t);
835 1.13 cgd totlen -= 2 * sizeof(u_int16_t);
836 1.9 mycroft }
837 1.9 mycroft MGETHDR(m, M_DONTWAIT, MT_DATA);
838 1.9 mycroft if (m == 0)
839 1.9 mycroft return (0);
840 1.9 mycroft m->m_pkthdr.rcvif = ifp;
841 1.9 mycroft m->m_pkthdr.len = totlen;
842 1.9 mycroft m->m_len = MHLEN;
843 1.9 mycroft
844 1.9 mycroft while (totlen > 0) {
845 1.9 mycroft if (top) {
846 1.9 mycroft MGET(m, M_DONTWAIT, MT_DATA);
847 1.9 mycroft if (m == 0) {
848 1.9 mycroft m_freem(top);
849 1.9 mycroft return (0);
850 1.9 mycroft }
851 1.9 mycroft m->m_len = MLEN;
852 1.9 mycroft }
853 1.9 mycroft len = min(totlen, epkt - cp);
854 1.9 mycroft if (len >= MINCLSIZE) {
855 1.9 mycroft MCLGET(m, M_DONTWAIT);
856 1.19 mycroft if ((m->m_flags & M_EXT) == 0) {
857 1.20 mycroft m_free(m);
858 1.19 mycroft m_freem(top);
859 1.19 mycroft return (0);
860 1.19 mycroft }
861 1.19 mycroft m->m_len = len = min(len, MCLBYTES);
862 1.9 mycroft } else {
863 1.9 mycroft /*
864 1.9 mycroft * Place initial small packet/header at end of mbuf.
865 1.9 mycroft */
866 1.9 mycroft if (len < m->m_len) {
867 1.9 mycroft if (top == 0 && len + max_linkhdr <= m->m_len)
868 1.9 mycroft m->m_data += max_linkhdr;
869 1.9 mycroft m->m_len = len;
870 1.9 mycroft } else
871 1.9 mycroft len = m->m_len;
872 1.9 mycroft }
873 1.9 mycroft if (copy)
874 1.14 christos copy(cp, mtod(m, caddr_t), (size_t)len);
875 1.9 mycroft else
876 1.30 perry memcpy(mtod(m, caddr_t), cp, (size_t)len);
877 1.9 mycroft cp += len;
878 1.9 mycroft *mp = m;
879 1.9 mycroft mp = &m->m_next;
880 1.9 mycroft totlen -= len;
881 1.9 mycroft if (cp == epkt)
882 1.9 mycroft cp = buf;
883 1.9 mycroft }
884 1.9 mycroft return (top);
885 1.18 thorpej }
886 1.18 thorpej
887 1.18 thorpej /*
888 1.18 thorpej * Copy data from a buffer back into the indicated mbuf chain,
889 1.18 thorpej * starting "off" bytes from the beginning, extending the mbuf
890 1.18 thorpej * chain if necessary.
891 1.18 thorpej */
892 1.18 thorpej void
893 1.18 thorpej m_copyback(m0, off, len, cp)
894 1.18 thorpej struct mbuf *m0;
895 1.27 matt int off;
896 1.27 matt int len;
897 1.18 thorpej caddr_t cp;
898 1.18 thorpej {
899 1.27 matt int mlen;
900 1.27 matt struct mbuf *m = m0, *n;
901 1.18 thorpej int totlen = 0;
902 1.18 thorpej
903 1.18 thorpej if (m0 == 0)
904 1.18 thorpej return;
905 1.18 thorpej while (off > (mlen = m->m_len)) {
906 1.18 thorpej off -= mlen;
907 1.18 thorpej totlen += mlen;
908 1.18 thorpej if (m->m_next == 0) {
909 1.18 thorpej n = m_getclr(M_DONTWAIT, m->m_type);
910 1.18 thorpej if (n == 0)
911 1.18 thorpej goto out;
912 1.18 thorpej n->m_len = min(MLEN, len + off);
913 1.18 thorpej m->m_next = n;
914 1.18 thorpej }
915 1.18 thorpej m = m->m_next;
916 1.18 thorpej }
917 1.18 thorpej while (len > 0) {
918 1.18 thorpej mlen = min (m->m_len - off, len);
919 1.30 perry memcpy(mtod(m, caddr_t) + off, cp, (unsigned)mlen);
920 1.18 thorpej cp += mlen;
921 1.18 thorpej len -= mlen;
922 1.18 thorpej mlen += off;
923 1.18 thorpej off = 0;
924 1.18 thorpej totlen += mlen;
925 1.18 thorpej if (len == 0)
926 1.18 thorpej break;
927 1.18 thorpej if (m->m_next == 0) {
928 1.18 thorpej n = m_get(M_DONTWAIT, m->m_type);
929 1.18 thorpej if (n == 0)
930 1.18 thorpej break;
931 1.18 thorpej n->m_len = min(MLEN, len);
932 1.18 thorpej m->m_next = n;
933 1.18 thorpej }
934 1.18 thorpej m = m->m_next;
935 1.18 thorpej }
936 1.18 thorpej out: if (((m = m0)->m_flags & M_PKTHDR) && (m->m_pkthdr.len < totlen))
937 1.18 thorpej m->m_pkthdr.len = totlen;
938 1.1 cgd }
939