uipc_mbuf.c revision 1.55 1 1.55 simonb /* $NetBSD: uipc_mbuf.c,v 1.55 2001/10/29 07:02:31 simonb Exp $ */
2 1.42 thorpej
3 1.42 thorpej /*-
4 1.53 thorpej * Copyright (c) 1999, 2001 The NetBSD Foundation, Inc.
5 1.42 thorpej * All rights reserved.
6 1.42 thorpej *
7 1.42 thorpej * This code is derived from software contributed to The NetBSD Foundation
8 1.42 thorpej * by Jason R. Thorpe of the Numerical Aerospace Simulation Facility,
9 1.42 thorpej * NASA Ames Research Center.
10 1.42 thorpej *
11 1.42 thorpej * Redistribution and use in source and binary forms, with or without
12 1.42 thorpej * modification, are permitted provided that the following conditions
13 1.42 thorpej * are met:
14 1.42 thorpej * 1. Redistributions of source code must retain the above copyright
15 1.42 thorpej * notice, this list of conditions and the following disclaimer.
16 1.42 thorpej * 2. Redistributions in binary form must reproduce the above copyright
17 1.42 thorpej * notice, this list of conditions and the following disclaimer in the
18 1.42 thorpej * documentation and/or other materials provided with the distribution.
19 1.42 thorpej * 3. All advertising materials mentioning features or use of this software
20 1.42 thorpej * must display the following acknowledgement:
21 1.42 thorpej * This product includes software developed by the NetBSD
22 1.42 thorpej * Foundation, Inc. and its contributors.
23 1.42 thorpej * 4. Neither the name of The NetBSD Foundation nor the names of its
24 1.42 thorpej * contributors may be used to endorse or promote products derived
25 1.42 thorpej * from this software without specific prior written permission.
26 1.42 thorpej *
27 1.42 thorpej * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
28 1.42 thorpej * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
29 1.42 thorpej * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
30 1.42 thorpej * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
31 1.42 thorpej * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
32 1.42 thorpej * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
33 1.42 thorpej * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
34 1.42 thorpej * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
35 1.42 thorpej * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
36 1.42 thorpej * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
37 1.42 thorpej * POSSIBILITY OF SUCH DAMAGE.
38 1.42 thorpej */
39 1.10 cgd
40 1.1 cgd /*
41 1.9 mycroft * Copyright (c) 1982, 1986, 1988, 1991, 1993
42 1.9 mycroft * The Regents of the University of California. All rights reserved.
43 1.1 cgd *
44 1.1 cgd * Redistribution and use in source and binary forms, with or without
45 1.1 cgd * modification, are permitted provided that the following conditions
46 1.1 cgd * are met:
47 1.1 cgd * 1. Redistributions of source code must retain the above copyright
48 1.1 cgd * notice, this list of conditions and the following disclaimer.
49 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
50 1.1 cgd * notice, this list of conditions and the following disclaimer in the
51 1.1 cgd * documentation and/or other materials provided with the distribution.
52 1.1 cgd * 3. All advertising materials mentioning features or use of this software
53 1.1 cgd * must display the following acknowledgement:
54 1.1 cgd * This product includes software developed by the University of
55 1.1 cgd * California, Berkeley and its contributors.
56 1.1 cgd * 4. Neither the name of the University nor the names of its contributors
57 1.1 cgd * may be used to endorse or promote products derived from this software
58 1.1 cgd * without specific prior written permission.
59 1.1 cgd *
60 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
61 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
62 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
63 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
64 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
65 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
66 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
67 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
68 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
69 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
70 1.1 cgd * SUCH DAMAGE.
71 1.1 cgd *
72 1.26 fvdl * @(#)uipc_mbuf.c 8.4 (Berkeley) 2/14/95
73 1.1 cgd */
74 1.24 mrg
75 1.6 mycroft #include <sys/param.h>
76 1.6 mycroft #include <sys/systm.h>
77 1.6 mycroft #include <sys/proc.h>
78 1.6 mycroft #include <sys/malloc.h>
79 1.9 mycroft #include <sys/map.h>
80 1.1 cgd #define MBTYPES
81 1.6 mycroft #include <sys/mbuf.h>
82 1.6 mycroft #include <sys/kernel.h>
83 1.6 mycroft #include <sys/syslog.h>
84 1.6 mycroft #include <sys/domain.h>
85 1.6 mycroft #include <sys/protosw.h>
86 1.28 thorpej #include <sys/pool.h>
87 1.27 matt #include <sys/socket.h>
88 1.55 simonb #include <sys/sysctl.h>
89 1.55 simonb
90 1.27 matt #include <net/if.h>
91 1.14 christos
92 1.23 mrg #include <uvm/uvm_extern.h>
93 1.23 mrg
94 1.42 thorpej
95 1.28 thorpej struct pool mbpool; /* mbuf pool */
96 1.28 thorpej struct pool mclpool; /* mbuf cluster pool */
97 1.28 thorpej
98 1.53 thorpej struct pool_cache mbpool_cache;
99 1.53 thorpej struct pool_cache mclpool_cache;
100 1.53 thorpej
101 1.18 thorpej struct mbstat mbstat;
102 1.18 thorpej int max_linkhdr;
103 1.18 thorpej int max_protohdr;
104 1.18 thorpej int max_hdr;
105 1.18 thorpej int max_datalen;
106 1.18 thorpej
107 1.28 thorpej void *mclpool_alloc __P((unsigned long, int, int));
108 1.28 thorpej void mclpool_release __P((void *, unsigned long, int));
109 1.44 itojun static struct mbuf *m_copym0 __P((struct mbuf *, int, int, int, int));
110 1.28 thorpej
111 1.42 thorpej const char *mclpool_warnmsg =
112 1.42 thorpej "WARNING: mclpool limit reached; increase NMBCLUSTERS";
113 1.42 thorpej
114 1.28 thorpej /*
115 1.40 thorpej * Initialize the mbuf allcator.
116 1.28 thorpej */
117 1.4 jtc void
118 1.1 cgd mbinit()
119 1.1 cgd {
120 1.1 cgd
121 1.42 thorpej pool_init(&mbpool, msize, 0, 0, 0, "mbpl", 0, NULL, NULL, 0);
122 1.42 thorpej pool_init(&mclpool, mclbytes, 0, 0, 0, "mclpl", 0, mclpool_alloc,
123 1.28 thorpej mclpool_release, 0);
124 1.53 thorpej
125 1.53 thorpej pool_cache_init(&mbpool_cache, &mbpool, NULL, NULL, NULL);
126 1.53 thorpej pool_cache_init(&mclpool_cache, &mclpool, NULL, NULL, NULL);
127 1.37 thorpej
128 1.37 thorpej /*
129 1.39 thorpej * Set the hard limit on the mclpool to the number of
130 1.39 thorpej * mbuf clusters the kernel is to support. Log the limit
131 1.39 thorpej * reached message max once a minute.
132 1.39 thorpej */
133 1.42 thorpej pool_sethardlimit(&mclpool, nmbclusters, mclpool_warnmsg, 60);
134 1.42 thorpej
135 1.39 thorpej /*
136 1.42 thorpej * Set a low water mark for both mbufs and clusters. This should
137 1.42 thorpej * help ensure that they can be allocated in a memory starvation
138 1.42 thorpej * situation. This is important for e.g. diskless systems which
139 1.42 thorpej * must allocate mbufs in order for the pagedaemon to clean pages.
140 1.37 thorpej */
141 1.42 thorpej pool_setlowat(&mbpool, mblowat);
142 1.42 thorpej pool_setlowat(&mclpool, mcllowat);
143 1.42 thorpej }
144 1.42 thorpej
145 1.42 thorpej int
146 1.42 thorpej sysctl_dombuf(name, namelen, oldp, oldlenp, newp, newlen)
147 1.42 thorpej int *name;
148 1.42 thorpej u_int namelen;
149 1.42 thorpej void *oldp;
150 1.42 thorpej size_t *oldlenp;
151 1.42 thorpej void *newp;
152 1.42 thorpej size_t newlen;
153 1.42 thorpej {
154 1.42 thorpej int error, newval;
155 1.42 thorpej
156 1.42 thorpej /* All sysctl names at this level are terminal. */
157 1.42 thorpej if (namelen != 1)
158 1.42 thorpej return (ENOTDIR); /* overloaded */
159 1.42 thorpej
160 1.42 thorpej switch (name[0]) {
161 1.42 thorpej case MBUF_MSIZE:
162 1.42 thorpej return (sysctl_rdint(oldp, oldlenp, newp, msize));
163 1.42 thorpej case MBUF_MCLBYTES:
164 1.42 thorpej return (sysctl_rdint(oldp, oldlenp, newp, mclbytes));
165 1.42 thorpej case MBUF_NMBCLUSTERS:
166 1.42 thorpej /*
167 1.42 thorpej * If we have direct-mapped pool pages, we can adjust this
168 1.42 thorpej * number on the fly. If not, we're limited by the size
169 1.42 thorpej * of mb_map, and cannot change this value.
170 1.42 thorpej *
171 1.42 thorpej * Note: we only allow the value to be increased, never
172 1.42 thorpej * decreased.
173 1.42 thorpej */
174 1.42 thorpej if (mb_map == NULL) {
175 1.42 thorpej newval = nmbclusters;
176 1.42 thorpej error = sysctl_int(oldp, oldlenp, newp, newlen,
177 1.42 thorpej &newval);
178 1.42 thorpej if (error != 0)
179 1.42 thorpej return (error);
180 1.42 thorpej if (newp != NULL) {
181 1.42 thorpej if (newval >= nmbclusters) {
182 1.42 thorpej nmbclusters = newval;
183 1.42 thorpej pool_sethardlimit(&mclpool,
184 1.42 thorpej nmbclusters, mclpool_warnmsg, 60);
185 1.42 thorpej } else
186 1.42 thorpej error = EINVAL;
187 1.42 thorpej }
188 1.42 thorpej return (error);
189 1.42 thorpej } else
190 1.42 thorpej return (sysctl_rdint(oldp, oldlenp, newp, nmbclusters));
191 1.42 thorpej case MBUF_MBLOWAT:
192 1.42 thorpej case MBUF_MCLLOWAT:
193 1.42 thorpej /* New value must be >= 0. */
194 1.42 thorpej newval = (name[0] == MBUF_MBLOWAT) ? mblowat : mcllowat;
195 1.42 thorpej error = sysctl_int(oldp, oldlenp, newp, newlen, &newval);
196 1.42 thorpej if (error != 0)
197 1.42 thorpej return (error);
198 1.42 thorpej if (newp != NULL) {
199 1.42 thorpej if (newval >= 0) {
200 1.42 thorpej if (name[0] == MBUF_MBLOWAT) {
201 1.42 thorpej mblowat = newval;
202 1.42 thorpej pool_setlowat(&mbpool, newval);
203 1.42 thorpej } else {
204 1.42 thorpej mcllowat = newval;
205 1.42 thorpej pool_setlowat(&mclpool, newval);
206 1.42 thorpej }
207 1.42 thorpej } else
208 1.42 thorpej error = EINVAL;
209 1.42 thorpej }
210 1.42 thorpej return (error);
211 1.42 thorpej default:
212 1.42 thorpej return (EOPNOTSUPP);
213 1.42 thorpej }
214 1.42 thorpej /* NOTREACHED */
215 1.28 thorpej }
216 1.28 thorpej
217 1.28 thorpej void *
218 1.28 thorpej mclpool_alloc(sz, flags, mtype)
219 1.28 thorpej unsigned long sz;
220 1.28 thorpej int flags;
221 1.28 thorpej int mtype;
222 1.28 thorpej {
223 1.32 thorpej boolean_t waitok = (flags & PR_WAITOK) ? TRUE : FALSE;
224 1.28 thorpej
225 1.54 chs return ((void *)uvm_km_alloc_poolpage1(mb_map, NULL, waitok));
226 1.1 cgd }
227 1.1 cgd
228 1.28 thorpej void
229 1.28 thorpej mclpool_release(v, sz, mtype)
230 1.28 thorpej void *v;
231 1.28 thorpej unsigned long sz;
232 1.28 thorpej int mtype;
233 1.1 cgd {
234 1.1 cgd
235 1.31 thorpej uvm_km_free_poolpage1(mb_map, (vaddr_t)v);
236 1.1 cgd }
237 1.1 cgd
238 1.1 cgd /*
239 1.1 cgd * When MGET failes, ask protocols to free space when short of memory,
240 1.1 cgd * then re-attempt to allocate an mbuf.
241 1.1 cgd */
242 1.1 cgd struct mbuf *
243 1.1 cgd m_retry(i, t)
244 1.1 cgd int i, t;
245 1.1 cgd {
246 1.27 matt struct mbuf *m;
247 1.1 cgd
248 1.29 thorpej m_reclaim(i);
249 1.1 cgd #define m_retry(i, t) (struct mbuf *)0
250 1.1 cgd MGET(m, i, t);
251 1.1 cgd #undef m_retry
252 1.18 thorpej if (m != NULL)
253 1.18 thorpej mbstat.m_wait++;
254 1.18 thorpej else
255 1.18 thorpej mbstat.m_drops++;
256 1.1 cgd return (m);
257 1.1 cgd }
258 1.1 cgd
259 1.1 cgd /*
260 1.1 cgd * As above; retry an MGETHDR.
261 1.1 cgd */
262 1.1 cgd struct mbuf *
263 1.1 cgd m_retryhdr(i, t)
264 1.1 cgd int i, t;
265 1.1 cgd {
266 1.27 matt struct mbuf *m;
267 1.1 cgd
268 1.29 thorpej m_reclaim(i);
269 1.1 cgd #define m_retryhdr(i, t) (struct mbuf *)0
270 1.1 cgd MGETHDR(m, i, t);
271 1.1 cgd #undef m_retryhdr
272 1.18 thorpej if (m != NULL)
273 1.18 thorpej mbstat.m_wait++;
274 1.18 thorpej else
275 1.18 thorpej mbstat.m_drops++;
276 1.1 cgd return (m);
277 1.1 cgd }
278 1.1 cgd
279 1.14 christos void
280 1.29 thorpej m_reclaim(how)
281 1.29 thorpej int how;
282 1.1 cgd {
283 1.27 matt struct domain *dp;
284 1.27 matt struct protosw *pr;
285 1.27 matt struct ifnet *ifp;
286 1.52 thorpej int s = splvm();
287 1.1 cgd
288 1.33 thorpej for (dp = domains; dp; dp = dp->dom_next)
289 1.33 thorpej for (pr = dp->dom_protosw;
290 1.33 thorpej pr < dp->dom_protoswNPROTOSW; pr++)
291 1.33 thorpej if (pr->pr_drain)
292 1.33 thorpej (*pr->pr_drain)();
293 1.27 matt for (ifp = TAILQ_FIRST(&ifnet); ifp; ifp = TAILQ_NEXT(ifp, if_list))
294 1.27 matt if (ifp->if_drain)
295 1.27 matt (*ifp->if_drain)(ifp);
296 1.1 cgd splx(s);
297 1.1 cgd mbstat.m_drain++;
298 1.1 cgd }
299 1.1 cgd
/*
 * Space allocation routines.
 * These are also available as macros
 * for critical paths.
 */

/*
 * Function form of MGET: allocate one mbuf of the given type using
 * the wait mode "nowait".  Returns whatever MGET produced.
 */
struct mbuf *
m_get(nowait, type)
	int nowait, type;
{
	struct mbuf *mb;

	MGET(mb, nowait, type);
	return (mb);
}
314 1.1 cgd
/*
 * Function form of MGETHDR: allocate one packet header mbuf of the
 * given type using the wait mode "nowait".  Returns whatever MGETHDR
 * produced.
 */
struct mbuf *
m_gethdr(nowait, type)
	int nowait, type;
{
	struct mbuf *mb;

	MGETHDR(mb, nowait, type);
	return (mb);
}
324 1.1 cgd
325 1.1 cgd struct mbuf *
326 1.5 cgd m_getclr(nowait, type)
327 1.5 cgd int nowait, type;
328 1.1 cgd {
329 1.27 matt struct mbuf *m;
330 1.1 cgd
331 1.5 cgd MGET(m, nowait, type);
332 1.1 cgd if (m == 0)
333 1.1 cgd return (0);
334 1.30 perry memset(mtod(m, caddr_t), 0, MLEN);
335 1.1 cgd return (m);
336 1.1 cgd }
337 1.1 cgd
/*
 * Function form of MFREE: release the single mbuf "m" and return the
 * successor that MFREE reports for it.
 */
struct mbuf *
m_free(m)
	struct mbuf *m;
{
	struct mbuf *successor;

	MFREE(m, successor);
	return (successor);
}
347 1.1 cgd
/*
 * Release every mbuf of the chain headed by "m".  A null chain is
 * accepted and ignored.
 */
void
m_freem(m)
	struct mbuf *m;
{
	struct mbuf *nxt;

	while (m != NULL) {
		MFREE(m, nxt);
		m = nxt;
	}
}
361 1.1 cgd
362 1.1 cgd /*
363 1.1 cgd * Mbuffer utility routines.
364 1.1 cgd */
365 1.1 cgd
366 1.1 cgd /*
367 1.1 cgd * Lesser-used path for M_PREPEND:
368 1.1 cgd * allocate new mbuf to prepend to chain,
369 1.1 cgd * copy junk along.
370 1.1 cgd */
371 1.1 cgd struct mbuf *
372 1.9 mycroft m_prepend(m, len, how)
373 1.27 matt struct mbuf *m;
374 1.9 mycroft int len, how;
375 1.1 cgd {
376 1.1 cgd struct mbuf *mn;
377 1.1 cgd
378 1.9 mycroft MGET(mn, how, m->m_type);
379 1.1 cgd if (mn == (struct mbuf *)NULL) {
380 1.1 cgd m_freem(m);
381 1.1 cgd return ((struct mbuf *)NULL);
382 1.1 cgd }
383 1.1 cgd if (m->m_flags & M_PKTHDR) {
384 1.1 cgd M_COPY_PKTHDR(mn, m);
385 1.1 cgd m->m_flags &= ~M_PKTHDR;
386 1.1 cgd }
387 1.1 cgd mn->m_next = m;
388 1.1 cgd m = mn;
389 1.1 cgd if (len < MHLEN)
390 1.1 cgd MH_ALIGN(m, len);
391 1.1 cgd m->m_len = len;
392 1.1 cgd return (m);
393 1.1 cgd }
394 1.1 cgd
/*
 * Make a copy of an mbuf chain starting "off0" bytes from the beginning,
 * continuing for "len" bytes.  If len is M_COPYALL, copy to end of mbuf.
 * The wait parameter is a choice of M_WAIT/M_DONTWAIT from caller.
 *
 * MCFail counts copies that produced no chain.
 */
int MCFail;

struct mbuf *
m_copym(m, off0, len, wait)
	struct mbuf *m;
	int off0, len, wait;
{
	/* A zero "deep" argument requests a shallow copy on M_EXT. */
	return (m_copym0(m, off0, len, wait, 0));
}
410 1.44 itojun
/*
 * Like m_copym(), but external storage is duplicated rather than
 * shared: the request is forwarded to m_copym0() with "deep" set.
 */
struct mbuf *
m_dup(m, off0, len, wait)
	struct mbuf *m;
	int off0, len, wait;
{
	/* A non-zero "deep" argument requests a deep copy. */
	return (m_copym0(m, off0, len, wait, 1));
}
419 1.44 itojun
420 1.44 itojun static struct mbuf *
421 1.44 itojun m_copym0(m, off0, len, wait, deep)
422 1.44 itojun struct mbuf *m;
423 1.44 itojun int off0, wait;
424 1.44 itojun int len;
425 1.44 itojun int deep; /* deep copy */
426 1.44 itojun {
427 1.27 matt struct mbuf *n, **np;
428 1.27 matt int off = off0;
429 1.1 cgd struct mbuf *top;
430 1.1 cgd int copyhdr = 0;
431 1.1 cgd
432 1.1 cgd if (off < 0 || len < 0)
433 1.43 thorpej panic("m_copym: off %d, len %d", off, len);
434 1.1 cgd if (off == 0 && m->m_flags & M_PKTHDR)
435 1.1 cgd copyhdr = 1;
436 1.1 cgd while (off > 0) {
437 1.1 cgd if (m == 0)
438 1.43 thorpej panic("m_copym: m == 0");
439 1.1 cgd if (off < m->m_len)
440 1.1 cgd break;
441 1.1 cgd off -= m->m_len;
442 1.1 cgd m = m->m_next;
443 1.1 cgd }
444 1.1 cgd np = ⊤
445 1.1 cgd top = 0;
446 1.1 cgd while (len > 0) {
447 1.1 cgd if (m == 0) {
448 1.1 cgd if (len != M_COPYALL)
449 1.43 thorpej panic("m_copym: m == 0 and not COPYALL");
450 1.1 cgd break;
451 1.1 cgd }
452 1.1 cgd MGET(n, wait, m->m_type);
453 1.1 cgd *np = n;
454 1.1 cgd if (n == 0)
455 1.1 cgd goto nospace;
456 1.1 cgd if (copyhdr) {
457 1.1 cgd M_COPY_PKTHDR(n, m);
458 1.1 cgd if (len == M_COPYALL)
459 1.1 cgd n->m_pkthdr.len -= off0;
460 1.1 cgd else
461 1.1 cgd n->m_pkthdr.len = len;
462 1.1 cgd copyhdr = 0;
463 1.1 cgd }
464 1.9 mycroft n->m_len = min(len, m->m_len - off);
465 1.1 cgd if (m->m_flags & M_EXT) {
466 1.44 itojun if (!deep) {
467 1.44 itojun n->m_data = m->m_data + off;
468 1.44 itojun n->m_ext = m->m_ext;
469 1.44 itojun MCLADDREFERENCE(m, n);
470 1.44 itojun } else {
471 1.48 itojun /*
472 1.50 itojun * we are unsure about the way m was allocated.
473 1.50 itojun * copy into multiple MCLBYTES cluster mbufs.
474 1.48 itojun */
475 1.44 itojun MCLGET(n, wait);
476 1.50 itojun n->m_len = 0;
477 1.50 itojun n->m_len = M_TRAILINGSPACE(n);
478 1.50 itojun n->m_len = min(n->m_len, len);
479 1.50 itojun n->m_len = min(n->m_len, m->m_len - off);
480 1.50 itojun memcpy(mtod(n, caddr_t), mtod(m, caddr_t) + off,
481 1.44 itojun (unsigned)n->m_len);
482 1.44 itojun }
483 1.1 cgd } else
484 1.30 perry memcpy(mtod(n, caddr_t), mtod(m, caddr_t)+off,
485 1.1 cgd (unsigned)n->m_len);
486 1.1 cgd if (len != M_COPYALL)
487 1.1 cgd len -= n->m_len;
488 1.50 itojun off += n->m_len;
489 1.50 itojun #ifdef DIAGNOSTIC
490 1.50 itojun if (off > m->m_len)
491 1.50 itojun panic("m_copym0 overrun");
492 1.50 itojun #endif
493 1.50 itojun if (off == m->m_len) {
494 1.50 itojun m = m->m_next;
495 1.50 itojun off = 0;
496 1.50 itojun }
497 1.1 cgd np = &n->m_next;
498 1.1 cgd }
499 1.1 cgd if (top == 0)
500 1.1 cgd MCFail++;
501 1.1 cgd return (top);
502 1.1 cgd nospace:
503 1.1 cgd m_freem(top);
504 1.1 cgd MCFail++;
505 1.1 cgd return (0);
506 1.1 cgd }
507 1.1 cgd
508 1.1 cgd /*
509 1.18 thorpej * Copy an entire packet, including header (which must be present).
510 1.18 thorpej * An optimization of the common case `m_copym(m, 0, M_COPYALL, how)'.
511 1.18 thorpej */
512 1.18 thorpej struct mbuf *
513 1.18 thorpej m_copypacket(m, how)
514 1.18 thorpej struct mbuf *m;
515 1.18 thorpej int how;
516 1.18 thorpej {
517 1.18 thorpej struct mbuf *top, *n, *o;
518 1.18 thorpej
519 1.18 thorpej MGET(n, how, m->m_type);
520 1.18 thorpej top = n;
521 1.18 thorpej if (!n)
522 1.18 thorpej goto nospace;
523 1.18 thorpej
524 1.18 thorpej M_COPY_PKTHDR(n, m);
525 1.18 thorpej n->m_len = m->m_len;
526 1.18 thorpej if (m->m_flags & M_EXT) {
527 1.18 thorpej n->m_data = m->m_data;
528 1.18 thorpej n->m_ext = m->m_ext;
529 1.18 thorpej MCLADDREFERENCE(m, n);
530 1.18 thorpej } else {
531 1.30 perry memcpy(mtod(n, char *), mtod(m, char *), n->m_len);
532 1.18 thorpej }
533 1.18 thorpej
534 1.18 thorpej m = m->m_next;
535 1.18 thorpej while (m) {
536 1.18 thorpej MGET(o, how, m->m_type);
537 1.18 thorpej if (!o)
538 1.18 thorpej goto nospace;
539 1.18 thorpej
540 1.18 thorpej n->m_next = o;
541 1.18 thorpej n = n->m_next;
542 1.18 thorpej
543 1.18 thorpej n->m_len = m->m_len;
544 1.18 thorpej if (m->m_flags & M_EXT) {
545 1.18 thorpej n->m_data = m->m_data;
546 1.18 thorpej n->m_ext = m->m_ext;
547 1.18 thorpej MCLADDREFERENCE(m, n);
548 1.18 thorpej } else {
549 1.30 perry memcpy(mtod(n, char *), mtod(m, char *), n->m_len);
550 1.18 thorpej }
551 1.18 thorpej
552 1.18 thorpej m = m->m_next;
553 1.18 thorpej }
554 1.18 thorpej return top;
555 1.18 thorpej nospace:
556 1.18 thorpej m_freem(top);
557 1.18 thorpej MCFail++;
558 1.18 thorpej return 0;
559 1.18 thorpej }
560 1.18 thorpej
561 1.18 thorpej /*
562 1.1 cgd * Copy data from an mbuf chain starting "off" bytes from the beginning,
563 1.1 cgd * continuing for "len" bytes, into the indicated buffer.
564 1.1 cgd */
565 1.14 christos void
566 1.1 cgd m_copydata(m, off, len, cp)
567 1.27 matt struct mbuf *m;
568 1.27 matt int off;
569 1.27 matt int len;
570 1.1 cgd caddr_t cp;
571 1.1 cgd {
572 1.27 matt unsigned count;
573 1.1 cgd
574 1.1 cgd if (off < 0 || len < 0)
575 1.1 cgd panic("m_copydata");
576 1.1 cgd while (off > 0) {
577 1.1 cgd if (m == 0)
578 1.1 cgd panic("m_copydata");
579 1.1 cgd if (off < m->m_len)
580 1.1 cgd break;
581 1.1 cgd off -= m->m_len;
582 1.1 cgd m = m->m_next;
583 1.1 cgd }
584 1.1 cgd while (len > 0) {
585 1.1 cgd if (m == 0)
586 1.1 cgd panic("m_copydata");
587 1.9 mycroft count = min(m->m_len - off, len);
588 1.30 perry memcpy(cp, mtod(m, caddr_t) + off, count);
589 1.1 cgd len -= count;
590 1.1 cgd cp += count;
591 1.1 cgd off = 0;
592 1.1 cgd m = m->m_next;
593 1.1 cgd }
594 1.1 cgd }
595 1.1 cgd
596 1.1 cgd /*
597 1.1 cgd * Concatenate mbuf chain n to m.
598 1.1 cgd * Both chains must be of the same type (e.g. MT_DATA).
599 1.1 cgd * Any m_pkthdr is not updated.
600 1.1 cgd */
601 1.14 christos void
602 1.1 cgd m_cat(m, n)
603 1.27 matt struct mbuf *m, *n;
604 1.1 cgd {
605 1.1 cgd while (m->m_next)
606 1.1 cgd m = m->m_next;
607 1.1 cgd while (n) {
608 1.1 cgd if (m->m_flags & M_EXT ||
609 1.1 cgd m->m_data + m->m_len + n->m_len >= &m->m_dat[MLEN]) {
610 1.1 cgd /* just join the two chains */
611 1.1 cgd m->m_next = n;
612 1.1 cgd return;
613 1.1 cgd }
614 1.1 cgd /* splat the data from one into the other */
615 1.30 perry memcpy(mtod(m, caddr_t) + m->m_len, mtod(n, caddr_t),
616 1.1 cgd (u_int)n->m_len);
617 1.1 cgd m->m_len += n->m_len;
618 1.1 cgd n = m_free(n);
619 1.1 cgd }
620 1.1 cgd }
621 1.1 cgd
622 1.11 mycroft void
623 1.1 cgd m_adj(mp, req_len)
624 1.1 cgd struct mbuf *mp;
625 1.8 deraadt int req_len;
626 1.1 cgd {
627 1.27 matt int len = req_len;
628 1.27 matt struct mbuf *m;
629 1.27 matt int count;
630 1.1 cgd
631 1.1 cgd if ((m = mp) == NULL)
632 1.1 cgd return;
633 1.1 cgd if (len >= 0) {
634 1.1 cgd /*
635 1.1 cgd * Trim from head.
636 1.1 cgd */
637 1.1 cgd while (m != NULL && len > 0) {
638 1.1 cgd if (m->m_len <= len) {
639 1.1 cgd len -= m->m_len;
640 1.1 cgd m->m_len = 0;
641 1.1 cgd m = m->m_next;
642 1.1 cgd } else {
643 1.1 cgd m->m_len -= len;
644 1.1 cgd m->m_data += len;
645 1.1 cgd len = 0;
646 1.1 cgd }
647 1.1 cgd }
648 1.1 cgd m = mp;
649 1.1 cgd if (mp->m_flags & M_PKTHDR)
650 1.1 cgd m->m_pkthdr.len -= (req_len - len);
651 1.1 cgd } else {
652 1.1 cgd /*
653 1.1 cgd * Trim from tail. Scan the mbuf chain,
654 1.1 cgd * calculating its length and finding the last mbuf.
655 1.1 cgd * If the adjustment only affects this mbuf, then just
656 1.1 cgd * adjust and return. Otherwise, rescan and truncate
657 1.1 cgd * after the remaining size.
658 1.1 cgd */
659 1.1 cgd len = -len;
660 1.1 cgd count = 0;
661 1.1 cgd for (;;) {
662 1.1 cgd count += m->m_len;
663 1.1 cgd if (m->m_next == (struct mbuf *)0)
664 1.1 cgd break;
665 1.1 cgd m = m->m_next;
666 1.1 cgd }
667 1.1 cgd if (m->m_len >= len) {
668 1.1 cgd m->m_len -= len;
669 1.8 deraadt if (mp->m_flags & M_PKTHDR)
670 1.8 deraadt mp->m_pkthdr.len -= len;
671 1.1 cgd return;
672 1.1 cgd }
673 1.1 cgd count -= len;
674 1.1 cgd if (count < 0)
675 1.1 cgd count = 0;
676 1.1 cgd /*
677 1.1 cgd * Correct length for chain is "count".
678 1.1 cgd * Find the mbuf with last data, adjust its length,
679 1.1 cgd * and toss data from remaining mbufs on chain.
680 1.1 cgd */
681 1.1 cgd m = mp;
682 1.1 cgd if (m->m_flags & M_PKTHDR)
683 1.1 cgd m->m_pkthdr.len = count;
684 1.1 cgd for (; m; m = m->m_next) {
685 1.1 cgd if (m->m_len >= count) {
686 1.1 cgd m->m_len = count;
687 1.1 cgd break;
688 1.1 cgd }
689 1.1 cgd count -= m->m_len;
690 1.1 cgd }
691 1.18 thorpej while (m->m_next)
692 1.18 thorpej (m = m->m_next) ->m_len = 0;
693 1.1 cgd }
694 1.1 cgd }
695 1.1 cgd
696 1.1 cgd /*
697 1.1 cgd * Rearange an mbuf chain so that len bytes are contiguous
698 1.1 cgd * and in the data area of an mbuf (so that mtod and dtom
699 1.1 cgd * will work for a structure of size len). Returns the resulting
700 1.1 cgd * mbuf chain on success, frees it and returns null on failure.
701 1.1 cgd * If there is room, it will add up to max_protohdr-len extra bytes to the
702 1.1 cgd * contiguous region in an attempt to avoid being called next time.
703 1.1 cgd */
704 1.1 cgd int MPFail;
705 1.1 cgd
706 1.1 cgd struct mbuf *
707 1.1 cgd m_pullup(n, len)
708 1.27 matt struct mbuf *n;
709 1.1 cgd int len;
710 1.1 cgd {
711 1.27 matt struct mbuf *m;
712 1.27 matt int count;
713 1.1 cgd int space;
714 1.1 cgd
715 1.1 cgd /*
716 1.1 cgd * If first mbuf has no cluster, and has room for len bytes
717 1.1 cgd * without shifting current data, pullup into it,
718 1.1 cgd * otherwise allocate a new mbuf to prepend to the chain.
719 1.1 cgd */
720 1.1 cgd if ((n->m_flags & M_EXT) == 0 &&
721 1.1 cgd n->m_data + len < &n->m_dat[MLEN] && n->m_next) {
722 1.1 cgd if (n->m_len >= len)
723 1.1 cgd return (n);
724 1.1 cgd m = n;
725 1.1 cgd n = n->m_next;
726 1.1 cgd len -= m->m_len;
727 1.1 cgd } else {
728 1.1 cgd if (len > MHLEN)
729 1.1 cgd goto bad;
730 1.1 cgd MGET(m, M_DONTWAIT, n->m_type);
731 1.1 cgd if (m == 0)
732 1.1 cgd goto bad;
733 1.1 cgd m->m_len = 0;
734 1.1 cgd if (n->m_flags & M_PKTHDR) {
735 1.1 cgd M_COPY_PKTHDR(m, n);
736 1.1 cgd n->m_flags &= ~M_PKTHDR;
737 1.1 cgd }
738 1.1 cgd }
739 1.1 cgd space = &m->m_dat[MLEN] - (m->m_data + m->m_len);
740 1.1 cgd do {
741 1.1 cgd count = min(min(max(len, max_protohdr), space), n->m_len);
742 1.30 perry memcpy(mtod(m, caddr_t) + m->m_len, mtod(n, caddr_t),
743 1.1 cgd (unsigned)count);
744 1.1 cgd len -= count;
745 1.1 cgd m->m_len += count;
746 1.1 cgd n->m_len -= count;
747 1.1 cgd space -= count;
748 1.1 cgd if (n->m_len)
749 1.1 cgd n->m_data += count;
750 1.1 cgd else
751 1.1 cgd n = m_free(n);
752 1.1 cgd } while (len > 0 && n);
753 1.1 cgd if (len > 0) {
754 1.1 cgd (void) m_free(m);
755 1.1 cgd goto bad;
756 1.1 cgd }
757 1.1 cgd m->m_next = n;
758 1.1 cgd return (m);
759 1.1 cgd bad:
760 1.1 cgd m_freem(n);
761 1.1 cgd MPFail++;
762 1.1 cgd return (0);
763 1.9 mycroft }
764 1.9 mycroft
765 1.9 mycroft /*
766 1.9 mycroft * Partition an mbuf chain in two pieces, returning the tail --
767 1.9 mycroft * all but the first len0 bytes. In case of failure, it returns NULL and
768 1.9 mycroft * attempts to restore the chain to its original state.
769 1.9 mycroft */
770 1.9 mycroft struct mbuf *
771 1.9 mycroft m_split(m0, len0, wait)
772 1.27 matt struct mbuf *m0;
773 1.9 mycroft int len0, wait;
774 1.9 mycroft {
775 1.27 matt struct mbuf *m, *n;
776 1.22 thorpej unsigned len = len0, remain, len_save;
777 1.9 mycroft
778 1.9 mycroft for (m = m0; m && len > m->m_len; m = m->m_next)
779 1.9 mycroft len -= m->m_len;
780 1.9 mycroft if (m == 0)
781 1.9 mycroft return (0);
782 1.9 mycroft remain = m->m_len - len;
783 1.9 mycroft if (m0->m_flags & M_PKTHDR) {
784 1.9 mycroft MGETHDR(n, wait, m0->m_type);
785 1.9 mycroft if (n == 0)
786 1.9 mycroft return (0);
787 1.9 mycroft n->m_pkthdr.rcvif = m0->m_pkthdr.rcvif;
788 1.9 mycroft n->m_pkthdr.len = m0->m_pkthdr.len - len0;
789 1.22 thorpej len_save = m0->m_pkthdr.len;
790 1.9 mycroft m0->m_pkthdr.len = len0;
791 1.9 mycroft if (m->m_flags & M_EXT)
792 1.9 mycroft goto extpacket;
793 1.9 mycroft if (remain > MHLEN) {
794 1.9 mycroft /* m can't be the lead packet */
795 1.9 mycroft MH_ALIGN(n, 0);
796 1.9 mycroft n->m_next = m_split(m, len, wait);
797 1.9 mycroft if (n->m_next == 0) {
798 1.9 mycroft (void) m_free(n);
799 1.22 thorpej m0->m_pkthdr.len = len_save;
800 1.9 mycroft return (0);
801 1.9 mycroft } else
802 1.9 mycroft return (n);
803 1.9 mycroft } else
804 1.9 mycroft MH_ALIGN(n, remain);
805 1.9 mycroft } else if (remain == 0) {
806 1.9 mycroft n = m->m_next;
807 1.9 mycroft m->m_next = 0;
808 1.9 mycroft return (n);
809 1.9 mycroft } else {
810 1.9 mycroft MGET(n, wait, m->m_type);
811 1.9 mycroft if (n == 0)
812 1.9 mycroft return (0);
813 1.9 mycroft M_ALIGN(n, remain);
814 1.9 mycroft }
815 1.9 mycroft extpacket:
816 1.9 mycroft if (m->m_flags & M_EXT) {
817 1.9 mycroft n->m_ext = m->m_ext;
818 1.18 thorpej MCLADDREFERENCE(m, n);
819 1.9 mycroft n->m_data = m->m_data + len;
820 1.9 mycroft } else {
821 1.30 perry memcpy(mtod(n, caddr_t), mtod(m, caddr_t) + len, remain);
822 1.9 mycroft }
823 1.9 mycroft n->m_len = remain;
824 1.9 mycroft m->m_len = len;
825 1.9 mycroft n->m_next = m->m_next;
826 1.9 mycroft m->m_next = 0;
827 1.9 mycroft return (n);
828 1.9 mycroft }
829 1.9 mycroft /*
830 1.9 mycroft * Routine to copy from device local memory into mbufs.
831 1.9 mycroft */
832 1.9 mycroft struct mbuf *
833 1.9 mycroft m_devget(buf, totlen, off0, ifp, copy)
834 1.9 mycroft char *buf;
835 1.9 mycroft int totlen, off0;
836 1.9 mycroft struct ifnet *ifp;
837 1.18 thorpej void (*copy) __P((const void *from, void *to, size_t len));
838 1.9 mycroft {
839 1.27 matt struct mbuf *m;
840 1.9 mycroft struct mbuf *top = 0, **mp = ⊤
841 1.27 matt int off = off0, len;
842 1.27 matt char *cp;
843 1.9 mycroft char *epkt;
844 1.9 mycroft
845 1.9 mycroft cp = buf;
846 1.9 mycroft epkt = cp + totlen;
847 1.9 mycroft if (off) {
848 1.13 cgd /*
849 1.13 cgd * If 'off' is non-zero, packet is trailer-encapsulated,
850 1.13 cgd * so we have to skip the type and length fields.
851 1.13 cgd */
852 1.13 cgd cp += off + 2 * sizeof(u_int16_t);
853 1.13 cgd totlen -= 2 * sizeof(u_int16_t);
854 1.9 mycroft }
855 1.9 mycroft MGETHDR(m, M_DONTWAIT, MT_DATA);
856 1.9 mycroft if (m == 0)
857 1.9 mycroft return (0);
858 1.9 mycroft m->m_pkthdr.rcvif = ifp;
859 1.9 mycroft m->m_pkthdr.len = totlen;
860 1.9 mycroft m->m_len = MHLEN;
861 1.9 mycroft
862 1.9 mycroft while (totlen > 0) {
863 1.9 mycroft if (top) {
864 1.9 mycroft MGET(m, M_DONTWAIT, MT_DATA);
865 1.9 mycroft if (m == 0) {
866 1.9 mycroft m_freem(top);
867 1.9 mycroft return (0);
868 1.9 mycroft }
869 1.9 mycroft m->m_len = MLEN;
870 1.9 mycroft }
871 1.9 mycroft len = min(totlen, epkt - cp);
872 1.9 mycroft if (len >= MINCLSIZE) {
873 1.9 mycroft MCLGET(m, M_DONTWAIT);
874 1.19 mycroft if ((m->m_flags & M_EXT) == 0) {
875 1.20 mycroft m_free(m);
876 1.19 mycroft m_freem(top);
877 1.19 mycroft return (0);
878 1.19 mycroft }
879 1.19 mycroft m->m_len = len = min(len, MCLBYTES);
880 1.9 mycroft } else {
881 1.9 mycroft /*
882 1.9 mycroft * Place initial small packet/header at end of mbuf.
883 1.9 mycroft */
884 1.9 mycroft if (len < m->m_len) {
885 1.9 mycroft if (top == 0 && len + max_linkhdr <= m->m_len)
886 1.9 mycroft m->m_data += max_linkhdr;
887 1.9 mycroft m->m_len = len;
888 1.9 mycroft } else
889 1.9 mycroft len = m->m_len;
890 1.9 mycroft }
891 1.9 mycroft if (copy)
892 1.14 christos copy(cp, mtod(m, caddr_t), (size_t)len);
893 1.9 mycroft else
894 1.30 perry memcpy(mtod(m, caddr_t), cp, (size_t)len);
895 1.9 mycroft cp += len;
896 1.9 mycroft *mp = m;
897 1.9 mycroft mp = &m->m_next;
898 1.9 mycroft totlen -= len;
899 1.9 mycroft if (cp == epkt)
900 1.9 mycroft cp = buf;
901 1.9 mycroft }
902 1.9 mycroft return (top);
903 1.18 thorpej }
904 1.18 thorpej
905 1.18 thorpej /*
906 1.18 thorpej * Copy data from a buffer back into the indicated mbuf chain,
907 1.18 thorpej * starting "off" bytes from the beginning, extending the mbuf
908 1.18 thorpej * chain if necessary.
909 1.18 thorpej */
910 1.18 thorpej void
911 1.18 thorpej m_copyback(m0, off, len, cp)
912 1.18 thorpej struct mbuf *m0;
913 1.27 matt int off;
914 1.27 matt int len;
915 1.18 thorpej caddr_t cp;
916 1.18 thorpej {
917 1.27 matt int mlen;
918 1.27 matt struct mbuf *m = m0, *n;
919 1.18 thorpej int totlen = 0;
920 1.18 thorpej
921 1.18 thorpej if (m0 == 0)
922 1.18 thorpej return;
923 1.18 thorpej while (off > (mlen = m->m_len)) {
924 1.18 thorpej off -= mlen;
925 1.18 thorpej totlen += mlen;
926 1.18 thorpej if (m->m_next == 0) {
927 1.18 thorpej n = m_getclr(M_DONTWAIT, m->m_type);
928 1.18 thorpej if (n == 0)
929 1.18 thorpej goto out;
930 1.18 thorpej n->m_len = min(MLEN, len + off);
931 1.18 thorpej m->m_next = n;
932 1.18 thorpej }
933 1.18 thorpej m = m->m_next;
934 1.18 thorpej }
935 1.18 thorpej while (len > 0) {
936 1.18 thorpej mlen = min (m->m_len - off, len);
937 1.30 perry memcpy(mtod(m, caddr_t) + off, cp, (unsigned)mlen);
938 1.18 thorpej cp += mlen;
939 1.18 thorpej len -= mlen;
940 1.18 thorpej mlen += off;
941 1.18 thorpej off = 0;
942 1.18 thorpej totlen += mlen;
943 1.18 thorpej if (len == 0)
944 1.18 thorpej break;
945 1.18 thorpej if (m->m_next == 0) {
946 1.18 thorpej n = m_get(M_DONTWAIT, m->m_type);
947 1.18 thorpej if (n == 0)
948 1.18 thorpej break;
949 1.18 thorpej n->m_len = min(MLEN, len);
950 1.18 thorpej m->m_next = n;
951 1.18 thorpej }
952 1.18 thorpej m = m->m_next;
953 1.18 thorpej }
954 1.18 thorpej out: if (((m = m0)->m_flags & M_PKTHDR) && (m->m_pkthdr.len < totlen))
955 1.18 thorpej m->m_pkthdr.len = totlen;
956 1.1 cgd }
957