uipc_mbuf.c revision 1.52 1 1.52 thorpej /* $NetBSD: uipc_mbuf.c,v 1.52 2001/01/14 02:06:22 thorpej Exp $ */
2 1.42 thorpej
3 1.42 thorpej /*-
4 1.42 thorpej * Copyright (c) 1999 The NetBSD Foundation, Inc.
5 1.42 thorpej * All rights reserved.
6 1.42 thorpej *
7 1.42 thorpej * This code is derived from software contributed to The NetBSD Foundation
8 1.42 thorpej * by Jason R. Thorpe of the Numerical Aerospace Simulation Facility,
9 1.42 thorpej * NASA Ames Research Center.
10 1.42 thorpej *
11 1.42 thorpej * Redistribution and use in source and binary forms, with or without
12 1.42 thorpej * modification, are permitted provided that the following conditions
13 1.42 thorpej * are met:
14 1.42 thorpej * 1. Redistributions of source code must retain the above copyright
15 1.42 thorpej * notice, this list of conditions and the following disclaimer.
16 1.42 thorpej * 2. Redistributions in binary form must reproduce the above copyright
17 1.42 thorpej * notice, this list of conditions and the following disclaimer in the
18 1.42 thorpej * documentation and/or other materials provided with the distribution.
19 1.42 thorpej * 3. All advertising materials mentioning features or use of this software
20 1.42 thorpej * must display the following acknowledgement:
21 1.42 thorpej * This product includes software developed by the NetBSD
22 1.42 thorpej * Foundation, Inc. and its contributors.
23 1.42 thorpej * 4. Neither the name of The NetBSD Foundation nor the names of its
24 1.42 thorpej * contributors may be used to endorse or promote products derived
25 1.42 thorpej * from this software without specific prior written permission.
26 1.42 thorpej *
27 1.42 thorpej * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
28 1.42 thorpej * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
29 1.42 thorpej * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
30 1.42 thorpej * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
31 1.42 thorpej * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
32 1.42 thorpej * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
33 1.42 thorpej * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
34 1.42 thorpej * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
35 1.42 thorpej * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
36 1.42 thorpej * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
37 1.42 thorpej * POSSIBILITY OF SUCH DAMAGE.
38 1.42 thorpej */
39 1.10 cgd
40 1.1 cgd /*
41 1.9 mycroft * Copyright (c) 1982, 1986, 1988, 1991, 1993
42 1.9 mycroft * The Regents of the University of California. All rights reserved.
43 1.1 cgd *
44 1.1 cgd * Redistribution and use in source and binary forms, with or without
45 1.1 cgd * modification, are permitted provided that the following conditions
46 1.1 cgd * are met:
47 1.1 cgd * 1. Redistributions of source code must retain the above copyright
48 1.1 cgd * notice, this list of conditions and the following disclaimer.
49 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
50 1.1 cgd * notice, this list of conditions and the following disclaimer in the
51 1.1 cgd * documentation and/or other materials provided with the distribution.
52 1.1 cgd * 3. All advertising materials mentioning features or use of this software
53 1.1 cgd * must display the following acknowledgement:
54 1.1 cgd * This product includes software developed by the University of
55 1.1 cgd * California, Berkeley and its contributors.
56 1.1 cgd * 4. Neither the name of the University nor the names of its contributors
57 1.1 cgd * may be used to endorse or promote products derived from this software
58 1.1 cgd * without specific prior written permission.
59 1.1 cgd *
60 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
61 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
62 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
63 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
64 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
65 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
66 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
67 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
68 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
69 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
70 1.1 cgd * SUCH DAMAGE.
71 1.1 cgd *
72 1.26 fvdl * @(#)uipc_mbuf.c 8.4 (Berkeley) 2/14/95
73 1.1 cgd */
74 1.24 mrg
75 1.6 mycroft #include <sys/param.h>
76 1.6 mycroft #include <sys/systm.h>
77 1.6 mycroft #include <sys/proc.h>
78 1.6 mycroft #include <sys/malloc.h>
79 1.9 mycroft #include <sys/map.h>
80 1.1 cgd #define MBTYPES
81 1.6 mycroft #include <sys/mbuf.h>
82 1.6 mycroft #include <sys/kernel.h>
83 1.6 mycroft #include <sys/syslog.h>
84 1.6 mycroft #include <sys/domain.h>
85 1.6 mycroft #include <sys/protosw.h>
86 1.28 thorpej #include <sys/pool.h>
87 1.27 matt #include <sys/socket.h>
88 1.27 matt #include <net/if.h>
89 1.14 christos
90 1.23 mrg #include <uvm/uvm_extern.h>
91 1.23 mrg
92 1.42 thorpej #include <sys/sysctl.h>
93 1.42 thorpej
94 1.28 thorpej struct pool mbpool; /* mbuf pool */
95 1.28 thorpej struct pool mclpool; /* mbuf cluster pool */
96 1.28 thorpej
97 1.18 thorpej struct mbstat mbstat;
98 1.18 thorpej int max_linkhdr;
99 1.18 thorpej int max_protohdr;
100 1.18 thorpej int max_hdr;
101 1.18 thorpej int max_datalen;
102 1.18 thorpej
103 1.28 thorpej void *mclpool_alloc __P((unsigned long, int, int));
104 1.28 thorpej void mclpool_release __P((void *, unsigned long, int));
105 1.44 itojun static struct mbuf *m_copym0 __P((struct mbuf *, int, int, int, int));
106 1.28 thorpej
107 1.42 thorpej const char *mclpool_warnmsg =
108 1.42 thorpej "WARNING: mclpool limit reached; increase NMBCLUSTERS";
109 1.42 thorpej
110 1.28 thorpej /*
111 1.40 thorpej * Initialize the mbuf allcator.
112 1.28 thorpej */
113 1.4 jtc void
114 1.1 cgd mbinit()
115 1.1 cgd {
116 1.1 cgd
117 1.42 thorpej pool_init(&mbpool, msize, 0, 0, 0, "mbpl", 0, NULL, NULL, 0);
118 1.42 thorpej pool_init(&mclpool, mclbytes, 0, 0, 0, "mclpl", 0, mclpool_alloc,
119 1.28 thorpej mclpool_release, 0);
120 1.37 thorpej
121 1.37 thorpej /*
122 1.39 thorpej * Set the hard limit on the mclpool to the number of
123 1.39 thorpej * mbuf clusters the kernel is to support. Log the limit
124 1.39 thorpej * reached message max once a minute.
125 1.39 thorpej */
126 1.42 thorpej pool_sethardlimit(&mclpool, nmbclusters, mclpool_warnmsg, 60);
127 1.42 thorpej
128 1.39 thorpej /*
129 1.42 thorpej * Set a low water mark for both mbufs and clusters. This should
130 1.42 thorpej * help ensure that they can be allocated in a memory starvation
131 1.42 thorpej * situation. This is important for e.g. diskless systems which
132 1.42 thorpej * must allocate mbufs in order for the pagedaemon to clean pages.
133 1.37 thorpej */
134 1.42 thorpej pool_setlowat(&mbpool, mblowat);
135 1.42 thorpej pool_setlowat(&mclpool, mcllowat);
136 1.42 thorpej }
137 1.42 thorpej
138 1.42 thorpej int
139 1.42 thorpej sysctl_dombuf(name, namelen, oldp, oldlenp, newp, newlen)
140 1.42 thorpej int *name;
141 1.42 thorpej u_int namelen;
142 1.42 thorpej void *oldp;
143 1.42 thorpej size_t *oldlenp;
144 1.42 thorpej void *newp;
145 1.42 thorpej size_t newlen;
146 1.42 thorpej {
147 1.42 thorpej int error, newval;
148 1.42 thorpej
149 1.42 thorpej /* All sysctl names at this level are terminal. */
150 1.42 thorpej if (namelen != 1)
151 1.42 thorpej return (ENOTDIR); /* overloaded */
152 1.42 thorpej
153 1.42 thorpej switch (name[0]) {
154 1.42 thorpej case MBUF_MSIZE:
155 1.42 thorpej return (sysctl_rdint(oldp, oldlenp, newp, msize));
156 1.42 thorpej case MBUF_MCLBYTES:
157 1.42 thorpej return (sysctl_rdint(oldp, oldlenp, newp, mclbytes));
158 1.42 thorpej case MBUF_NMBCLUSTERS:
159 1.42 thorpej /*
160 1.42 thorpej * If we have direct-mapped pool pages, we can adjust this
161 1.42 thorpej * number on the fly. If not, we're limited by the size
162 1.42 thorpej * of mb_map, and cannot change this value.
163 1.42 thorpej *
164 1.42 thorpej * Note: we only allow the value to be increased, never
165 1.42 thorpej * decreased.
166 1.42 thorpej */
167 1.42 thorpej if (mb_map == NULL) {
168 1.42 thorpej newval = nmbclusters;
169 1.42 thorpej error = sysctl_int(oldp, oldlenp, newp, newlen,
170 1.42 thorpej &newval);
171 1.42 thorpej if (error != 0)
172 1.42 thorpej return (error);
173 1.42 thorpej if (newp != NULL) {
174 1.42 thorpej if (newval >= nmbclusters) {
175 1.42 thorpej nmbclusters = newval;
176 1.42 thorpej pool_sethardlimit(&mclpool,
177 1.42 thorpej nmbclusters, mclpool_warnmsg, 60);
178 1.42 thorpej } else
179 1.42 thorpej error = EINVAL;
180 1.42 thorpej }
181 1.42 thorpej return (error);
182 1.42 thorpej } else
183 1.42 thorpej return (sysctl_rdint(oldp, oldlenp, newp, nmbclusters));
184 1.42 thorpej case MBUF_MBLOWAT:
185 1.42 thorpej case MBUF_MCLLOWAT:
186 1.42 thorpej /* New value must be >= 0. */
187 1.42 thorpej newval = (name[0] == MBUF_MBLOWAT) ? mblowat : mcllowat;
188 1.42 thorpej error = sysctl_int(oldp, oldlenp, newp, newlen, &newval);
189 1.42 thorpej if (error != 0)
190 1.42 thorpej return (error);
191 1.42 thorpej if (newp != NULL) {
192 1.42 thorpej if (newval >= 0) {
193 1.42 thorpej if (name[0] == MBUF_MBLOWAT) {
194 1.42 thorpej mblowat = newval;
195 1.42 thorpej pool_setlowat(&mbpool, newval);
196 1.42 thorpej } else {
197 1.42 thorpej mcllowat = newval;
198 1.42 thorpej pool_setlowat(&mclpool, newval);
199 1.42 thorpej }
200 1.42 thorpej } else
201 1.42 thorpej error = EINVAL;
202 1.42 thorpej }
203 1.42 thorpej return (error);
204 1.42 thorpej default:
205 1.42 thorpej return (EOPNOTSUPP);
206 1.42 thorpej }
207 1.42 thorpej /* NOTREACHED */
208 1.28 thorpej }
209 1.28 thorpej
210 1.28 thorpej void *
211 1.28 thorpej mclpool_alloc(sz, flags, mtype)
212 1.28 thorpej unsigned long sz;
213 1.28 thorpej int flags;
214 1.28 thorpej int mtype;
215 1.28 thorpej {
216 1.32 thorpej boolean_t waitok = (flags & PR_WAITOK) ? TRUE : FALSE;
217 1.28 thorpej
218 1.39 thorpej return ((void *)uvm_km_alloc_poolpage1(mb_map, uvmexp.mb_object,
219 1.39 thorpej waitok));
220 1.1 cgd }
221 1.1 cgd
222 1.28 thorpej void
223 1.28 thorpej mclpool_release(v, sz, mtype)
224 1.28 thorpej void *v;
225 1.28 thorpej unsigned long sz;
226 1.28 thorpej int mtype;
227 1.1 cgd {
228 1.1 cgd
229 1.31 thorpej uvm_km_free_poolpage1(mb_map, (vaddr_t)v);
230 1.1 cgd }
231 1.1 cgd
232 1.1 cgd /*
233 1.1 cgd * When MGET failes, ask protocols to free space when short of memory,
234 1.1 cgd * then re-attempt to allocate an mbuf.
235 1.1 cgd */
236 1.1 cgd struct mbuf *
237 1.1 cgd m_retry(i, t)
238 1.1 cgd int i, t;
239 1.1 cgd {
240 1.27 matt struct mbuf *m;
241 1.1 cgd
242 1.29 thorpej m_reclaim(i);
243 1.1 cgd #define m_retry(i, t) (struct mbuf *)0
244 1.1 cgd MGET(m, i, t);
245 1.1 cgd #undef m_retry
246 1.18 thorpej if (m != NULL)
247 1.18 thorpej mbstat.m_wait++;
248 1.18 thorpej else
249 1.18 thorpej mbstat.m_drops++;
250 1.1 cgd return (m);
251 1.1 cgd }
252 1.1 cgd
253 1.1 cgd /*
254 1.1 cgd * As above; retry an MGETHDR.
255 1.1 cgd */
256 1.1 cgd struct mbuf *
257 1.1 cgd m_retryhdr(i, t)
258 1.1 cgd int i, t;
259 1.1 cgd {
260 1.27 matt struct mbuf *m;
261 1.1 cgd
262 1.29 thorpej m_reclaim(i);
263 1.1 cgd #define m_retryhdr(i, t) (struct mbuf *)0
264 1.1 cgd MGETHDR(m, i, t);
265 1.1 cgd #undef m_retryhdr
266 1.18 thorpej if (m != NULL)
267 1.18 thorpej mbstat.m_wait++;
268 1.18 thorpej else
269 1.18 thorpej mbstat.m_drops++;
270 1.1 cgd return (m);
271 1.1 cgd }
272 1.1 cgd
273 1.14 christos void
274 1.29 thorpej m_reclaim(how)
275 1.29 thorpej int how;
276 1.1 cgd {
277 1.27 matt struct domain *dp;
278 1.27 matt struct protosw *pr;
279 1.27 matt struct ifnet *ifp;
280 1.52 thorpej int s = splvm();
281 1.1 cgd
282 1.33 thorpej for (dp = domains; dp; dp = dp->dom_next)
283 1.33 thorpej for (pr = dp->dom_protosw;
284 1.33 thorpej pr < dp->dom_protoswNPROTOSW; pr++)
285 1.33 thorpej if (pr->pr_drain)
286 1.33 thorpej (*pr->pr_drain)();
287 1.27 matt for (ifp = TAILQ_FIRST(&ifnet); ifp; ifp = TAILQ_NEXT(ifp, if_list))
288 1.27 matt if (ifp->if_drain)
289 1.27 matt (*ifp->if_drain)(ifp);
290 1.1 cgd splx(s);
291 1.1 cgd mbstat.m_drain++;
292 1.1 cgd }
293 1.1 cgd
294 1.1 cgd /*
295 1.1 cgd * Space allocation routines.
296 1.1 cgd * These are also available as macros
297 1.1 cgd * for critical paths.
298 1.1 cgd */
/*
 * Function form of the MGET macro: allocate one mbuf of the given type.
 * "nowait" is passed straight through as MGET's wait argument.
 * Returns whatever MGET leaves in its result (NULL is treated as
 * failure by the callers in this file).
 */
struct mbuf *
m_get(nowait, type)
	int nowait, type;
{
	struct mbuf *mb;

	MGET(mb, nowait, type);
	return (mb);
}
308 1.1 cgd
/*
 * Function form of the MGETHDR macro: allocate one packet-header mbuf
 * of the given type.  "nowait" is passed straight through as MGETHDR's
 * wait argument.  Returns whatever MGETHDR leaves in its result.
 */
struct mbuf *
m_gethdr(nowait, type)
	int nowait, type;
{
	struct mbuf *mb;

	MGETHDR(mb, nowait, type);
	return (mb);
}
318 1.1 cgd
319 1.1 cgd struct mbuf *
320 1.5 cgd m_getclr(nowait, type)
321 1.5 cgd int nowait, type;
322 1.1 cgd {
323 1.27 matt struct mbuf *m;
324 1.1 cgd
325 1.5 cgd MGET(m, nowait, type);
326 1.1 cgd if (m == 0)
327 1.1 cgd return (0);
328 1.30 perry memset(mtod(m, caddr_t), 0, MLEN);
329 1.1 cgd return (m);
330 1.1 cgd }
331 1.1 cgd
/*
 * Function form of the MFREE macro: release the single mbuf "m" and
 * return the value MFREE stores in its second argument.  Callers in
 * this file (m_cat, m_pullup) use that value as the next mbuf of the
 * chain.
 */
struct mbuf *
m_free(m)
	struct mbuf *m;
{
	struct mbuf *successor;

	MFREE(m, successor);
	return (successor);
}
341 1.1 cgd
/*
 * Release an entire mbuf chain, one MFREE at a time.
 * A NULL chain is accepted and ignored.
 */
void
m_freem(m)
	struct mbuf *m;
{
	struct mbuf *n;

	while (m != NULL) {
		MFREE(m, n);
		m = n;
	}
}
355 1.1 cgd
356 1.1 cgd /*
357 1.1 cgd * Mbuffer utility routines.
358 1.1 cgd */
359 1.1 cgd
360 1.1 cgd /*
361 1.1 cgd * Lesser-used path for M_PREPEND:
362 1.1 cgd * allocate new mbuf to prepend to chain,
363 1.1 cgd * copy junk along.
364 1.1 cgd */
365 1.1 cgd struct mbuf *
366 1.9 mycroft m_prepend(m, len, how)
367 1.27 matt struct mbuf *m;
368 1.9 mycroft int len, how;
369 1.1 cgd {
370 1.1 cgd struct mbuf *mn;
371 1.1 cgd
372 1.9 mycroft MGET(mn, how, m->m_type);
373 1.1 cgd if (mn == (struct mbuf *)NULL) {
374 1.1 cgd m_freem(m);
375 1.1 cgd return ((struct mbuf *)NULL);
376 1.1 cgd }
377 1.1 cgd if (m->m_flags & M_PKTHDR) {
378 1.1 cgd M_COPY_PKTHDR(mn, m);
379 1.1 cgd m->m_flags &= ~M_PKTHDR;
380 1.1 cgd }
381 1.1 cgd mn->m_next = m;
382 1.1 cgd m = mn;
383 1.1 cgd if (len < MHLEN)
384 1.1 cgd MH_ALIGN(m, len);
385 1.1 cgd m->m_len = len;
386 1.1 cgd return (m);
387 1.1 cgd }
388 1.1 cgd
/*
 * Make a copy of an mbuf chain starting "off0" bytes from the beginning,
 * continuing for "len" bytes.  If len is M_COPYALL, copy to end of mbuf.
 * The wait parameter is a choice of M_WAIT/M_DONTWAIT from caller.
 *
 * Data held in external storage (M_EXT) is shared with the original,
 * not duplicated; see m_dup() for the duplicating variant.
 */
int MCFail;		/* incremented when a chain copy yields no result */

struct mbuf *
m_copym(m, off0, len, wait)
	struct mbuf *m;
	int off0, wait;
	int len;
{
	const int deep = 0;	/* shallow copy on M_EXT */

	return m_copym0(m, off0, len, wait, deep);
}
404 1.44 itojun
/*
 * Like m_copym(), but data held in external storage (M_EXT) is copied
 * into newly allocated mbufs instead of being shared with the original.
 */
struct mbuf *
m_dup(m, off0, len, wait)
	struct mbuf *m;
	int off0, wait;
	int len;
{
	const int deep = 1;	/* deep copy */

	return m_copym0(m, off0, len, wait, deep);
}
413 1.44 itojun
414 1.44 itojun static struct mbuf *
415 1.44 itojun m_copym0(m, off0, len, wait, deep)
416 1.44 itojun struct mbuf *m;
417 1.44 itojun int off0, wait;
418 1.44 itojun int len;
419 1.44 itojun int deep; /* deep copy */
420 1.44 itojun {
421 1.27 matt struct mbuf *n, **np;
422 1.27 matt int off = off0;
423 1.1 cgd struct mbuf *top;
424 1.1 cgd int copyhdr = 0;
425 1.1 cgd
426 1.1 cgd if (off < 0 || len < 0)
427 1.43 thorpej panic("m_copym: off %d, len %d", off, len);
428 1.1 cgd if (off == 0 && m->m_flags & M_PKTHDR)
429 1.1 cgd copyhdr = 1;
430 1.1 cgd while (off > 0) {
431 1.1 cgd if (m == 0)
432 1.43 thorpej panic("m_copym: m == 0");
433 1.1 cgd if (off < m->m_len)
434 1.1 cgd break;
435 1.1 cgd off -= m->m_len;
436 1.1 cgd m = m->m_next;
437 1.1 cgd }
438 1.1 cgd np = ⊤
439 1.1 cgd top = 0;
440 1.1 cgd while (len > 0) {
441 1.1 cgd if (m == 0) {
442 1.1 cgd if (len != M_COPYALL)
443 1.43 thorpej panic("m_copym: m == 0 and not COPYALL");
444 1.1 cgd break;
445 1.1 cgd }
446 1.1 cgd MGET(n, wait, m->m_type);
447 1.1 cgd *np = n;
448 1.1 cgd if (n == 0)
449 1.1 cgd goto nospace;
450 1.1 cgd if (copyhdr) {
451 1.1 cgd M_COPY_PKTHDR(n, m);
452 1.1 cgd if (len == M_COPYALL)
453 1.1 cgd n->m_pkthdr.len -= off0;
454 1.1 cgd else
455 1.1 cgd n->m_pkthdr.len = len;
456 1.1 cgd copyhdr = 0;
457 1.1 cgd }
458 1.9 mycroft n->m_len = min(len, m->m_len - off);
459 1.1 cgd if (m->m_flags & M_EXT) {
460 1.44 itojun if (!deep) {
461 1.44 itojun n->m_data = m->m_data + off;
462 1.44 itojun n->m_ext = m->m_ext;
463 1.44 itojun MCLADDREFERENCE(m, n);
464 1.44 itojun } else {
465 1.48 itojun /*
466 1.50 itojun * we are unsure about the way m was allocated.
467 1.50 itojun * copy into multiple MCLBYTES cluster mbufs.
468 1.48 itojun */
469 1.44 itojun MCLGET(n, wait);
470 1.50 itojun n->m_len = 0;
471 1.50 itojun n->m_len = M_TRAILINGSPACE(n);
472 1.50 itojun n->m_len = min(n->m_len, len);
473 1.50 itojun n->m_len = min(n->m_len, m->m_len - off);
474 1.50 itojun memcpy(mtod(n, caddr_t), mtod(m, caddr_t) + off,
475 1.44 itojun (unsigned)n->m_len);
476 1.44 itojun }
477 1.1 cgd } else
478 1.30 perry memcpy(mtod(n, caddr_t), mtod(m, caddr_t)+off,
479 1.1 cgd (unsigned)n->m_len);
480 1.1 cgd if (len != M_COPYALL)
481 1.1 cgd len -= n->m_len;
482 1.50 itojun off += n->m_len;
483 1.50 itojun #ifdef DIAGNOSTIC
484 1.50 itojun if (off > m->m_len)
485 1.50 itojun panic("m_copym0 overrun");
486 1.50 itojun #endif
487 1.50 itojun if (off == m->m_len) {
488 1.50 itojun m = m->m_next;
489 1.50 itojun off = 0;
490 1.50 itojun }
491 1.1 cgd np = &n->m_next;
492 1.1 cgd }
493 1.1 cgd if (top == 0)
494 1.1 cgd MCFail++;
495 1.1 cgd return (top);
496 1.1 cgd nospace:
497 1.1 cgd m_freem(top);
498 1.1 cgd MCFail++;
499 1.1 cgd return (0);
500 1.1 cgd }
501 1.1 cgd
502 1.1 cgd /*
503 1.18 thorpej * Copy an entire packet, including header (which must be present).
504 1.18 thorpej * An optimization of the common case `m_copym(m, 0, M_COPYALL, how)'.
505 1.18 thorpej */
506 1.18 thorpej struct mbuf *
507 1.18 thorpej m_copypacket(m, how)
508 1.18 thorpej struct mbuf *m;
509 1.18 thorpej int how;
510 1.18 thorpej {
511 1.18 thorpej struct mbuf *top, *n, *o;
512 1.18 thorpej
513 1.18 thorpej MGET(n, how, m->m_type);
514 1.18 thorpej top = n;
515 1.18 thorpej if (!n)
516 1.18 thorpej goto nospace;
517 1.18 thorpej
518 1.18 thorpej M_COPY_PKTHDR(n, m);
519 1.18 thorpej n->m_len = m->m_len;
520 1.18 thorpej if (m->m_flags & M_EXT) {
521 1.18 thorpej n->m_data = m->m_data;
522 1.18 thorpej n->m_ext = m->m_ext;
523 1.18 thorpej MCLADDREFERENCE(m, n);
524 1.18 thorpej } else {
525 1.30 perry memcpy(mtod(n, char *), mtod(m, char *), n->m_len);
526 1.18 thorpej }
527 1.18 thorpej
528 1.18 thorpej m = m->m_next;
529 1.18 thorpej while (m) {
530 1.18 thorpej MGET(o, how, m->m_type);
531 1.18 thorpej if (!o)
532 1.18 thorpej goto nospace;
533 1.18 thorpej
534 1.18 thorpej n->m_next = o;
535 1.18 thorpej n = n->m_next;
536 1.18 thorpej
537 1.18 thorpej n->m_len = m->m_len;
538 1.18 thorpej if (m->m_flags & M_EXT) {
539 1.18 thorpej n->m_data = m->m_data;
540 1.18 thorpej n->m_ext = m->m_ext;
541 1.18 thorpej MCLADDREFERENCE(m, n);
542 1.18 thorpej } else {
543 1.30 perry memcpy(mtod(n, char *), mtod(m, char *), n->m_len);
544 1.18 thorpej }
545 1.18 thorpej
546 1.18 thorpej m = m->m_next;
547 1.18 thorpej }
548 1.18 thorpej return top;
549 1.18 thorpej nospace:
550 1.18 thorpej m_freem(top);
551 1.18 thorpej MCFail++;
552 1.18 thorpej return 0;
553 1.18 thorpej }
554 1.18 thorpej
555 1.18 thorpej /*
556 1.1 cgd * Copy data from an mbuf chain starting "off" bytes from the beginning,
557 1.1 cgd * continuing for "len" bytes, into the indicated buffer.
558 1.1 cgd */
559 1.14 christos void
560 1.1 cgd m_copydata(m, off, len, cp)
561 1.27 matt struct mbuf *m;
562 1.27 matt int off;
563 1.27 matt int len;
564 1.1 cgd caddr_t cp;
565 1.1 cgd {
566 1.27 matt unsigned count;
567 1.1 cgd
568 1.1 cgd if (off < 0 || len < 0)
569 1.1 cgd panic("m_copydata");
570 1.1 cgd while (off > 0) {
571 1.1 cgd if (m == 0)
572 1.1 cgd panic("m_copydata");
573 1.1 cgd if (off < m->m_len)
574 1.1 cgd break;
575 1.1 cgd off -= m->m_len;
576 1.1 cgd m = m->m_next;
577 1.1 cgd }
578 1.1 cgd while (len > 0) {
579 1.1 cgd if (m == 0)
580 1.1 cgd panic("m_copydata");
581 1.9 mycroft count = min(m->m_len - off, len);
582 1.30 perry memcpy(cp, mtod(m, caddr_t) + off, count);
583 1.1 cgd len -= count;
584 1.1 cgd cp += count;
585 1.1 cgd off = 0;
586 1.1 cgd m = m->m_next;
587 1.1 cgd }
588 1.1 cgd }
589 1.1 cgd
590 1.1 cgd /*
591 1.1 cgd * Concatenate mbuf chain n to m.
592 1.1 cgd * Both chains must be of the same type (e.g. MT_DATA).
593 1.1 cgd * Any m_pkthdr is not updated.
594 1.1 cgd */
595 1.14 christos void
596 1.1 cgd m_cat(m, n)
597 1.27 matt struct mbuf *m, *n;
598 1.1 cgd {
599 1.1 cgd while (m->m_next)
600 1.1 cgd m = m->m_next;
601 1.1 cgd while (n) {
602 1.1 cgd if (m->m_flags & M_EXT ||
603 1.1 cgd m->m_data + m->m_len + n->m_len >= &m->m_dat[MLEN]) {
604 1.1 cgd /* just join the two chains */
605 1.1 cgd m->m_next = n;
606 1.1 cgd return;
607 1.1 cgd }
608 1.1 cgd /* splat the data from one into the other */
609 1.30 perry memcpy(mtod(m, caddr_t) + m->m_len, mtod(n, caddr_t),
610 1.1 cgd (u_int)n->m_len);
611 1.1 cgd m->m_len += n->m_len;
612 1.1 cgd n = m_free(n);
613 1.1 cgd }
614 1.1 cgd }
615 1.1 cgd
616 1.11 mycroft void
617 1.1 cgd m_adj(mp, req_len)
618 1.1 cgd struct mbuf *mp;
619 1.8 deraadt int req_len;
620 1.1 cgd {
621 1.27 matt int len = req_len;
622 1.27 matt struct mbuf *m;
623 1.27 matt int count;
624 1.1 cgd
625 1.1 cgd if ((m = mp) == NULL)
626 1.1 cgd return;
627 1.1 cgd if (len >= 0) {
628 1.1 cgd /*
629 1.1 cgd * Trim from head.
630 1.1 cgd */
631 1.1 cgd while (m != NULL && len > 0) {
632 1.1 cgd if (m->m_len <= len) {
633 1.1 cgd len -= m->m_len;
634 1.1 cgd m->m_len = 0;
635 1.1 cgd m = m->m_next;
636 1.1 cgd } else {
637 1.1 cgd m->m_len -= len;
638 1.1 cgd m->m_data += len;
639 1.1 cgd len = 0;
640 1.1 cgd }
641 1.1 cgd }
642 1.1 cgd m = mp;
643 1.1 cgd if (mp->m_flags & M_PKTHDR)
644 1.1 cgd m->m_pkthdr.len -= (req_len - len);
645 1.1 cgd } else {
646 1.1 cgd /*
647 1.1 cgd * Trim from tail. Scan the mbuf chain,
648 1.1 cgd * calculating its length and finding the last mbuf.
649 1.1 cgd * If the adjustment only affects this mbuf, then just
650 1.1 cgd * adjust and return. Otherwise, rescan and truncate
651 1.1 cgd * after the remaining size.
652 1.1 cgd */
653 1.1 cgd len = -len;
654 1.1 cgd count = 0;
655 1.1 cgd for (;;) {
656 1.1 cgd count += m->m_len;
657 1.1 cgd if (m->m_next == (struct mbuf *)0)
658 1.1 cgd break;
659 1.1 cgd m = m->m_next;
660 1.1 cgd }
661 1.1 cgd if (m->m_len >= len) {
662 1.1 cgd m->m_len -= len;
663 1.8 deraadt if (mp->m_flags & M_PKTHDR)
664 1.8 deraadt mp->m_pkthdr.len -= len;
665 1.1 cgd return;
666 1.1 cgd }
667 1.1 cgd count -= len;
668 1.1 cgd if (count < 0)
669 1.1 cgd count = 0;
670 1.1 cgd /*
671 1.1 cgd * Correct length for chain is "count".
672 1.1 cgd * Find the mbuf with last data, adjust its length,
673 1.1 cgd * and toss data from remaining mbufs on chain.
674 1.1 cgd */
675 1.1 cgd m = mp;
676 1.1 cgd if (m->m_flags & M_PKTHDR)
677 1.1 cgd m->m_pkthdr.len = count;
678 1.1 cgd for (; m; m = m->m_next) {
679 1.1 cgd if (m->m_len >= count) {
680 1.1 cgd m->m_len = count;
681 1.1 cgd break;
682 1.1 cgd }
683 1.1 cgd count -= m->m_len;
684 1.1 cgd }
685 1.18 thorpej while (m->m_next)
686 1.18 thorpej (m = m->m_next) ->m_len = 0;
687 1.1 cgd }
688 1.1 cgd }
689 1.1 cgd
690 1.1 cgd /*
691 1.1 cgd * Rearange an mbuf chain so that len bytes are contiguous
692 1.1 cgd * and in the data area of an mbuf (so that mtod and dtom
693 1.1 cgd * will work for a structure of size len). Returns the resulting
694 1.1 cgd * mbuf chain on success, frees it and returns null on failure.
695 1.1 cgd * If there is room, it will add up to max_protohdr-len extra bytes to the
696 1.1 cgd * contiguous region in an attempt to avoid being called next time.
697 1.1 cgd */
698 1.1 cgd int MPFail;
699 1.1 cgd
700 1.1 cgd struct mbuf *
701 1.1 cgd m_pullup(n, len)
702 1.27 matt struct mbuf *n;
703 1.1 cgd int len;
704 1.1 cgd {
705 1.27 matt struct mbuf *m;
706 1.27 matt int count;
707 1.1 cgd int space;
708 1.1 cgd
709 1.1 cgd /*
710 1.1 cgd * If first mbuf has no cluster, and has room for len bytes
711 1.1 cgd * without shifting current data, pullup into it,
712 1.1 cgd * otherwise allocate a new mbuf to prepend to the chain.
713 1.1 cgd */
714 1.1 cgd if ((n->m_flags & M_EXT) == 0 &&
715 1.1 cgd n->m_data + len < &n->m_dat[MLEN] && n->m_next) {
716 1.1 cgd if (n->m_len >= len)
717 1.1 cgd return (n);
718 1.1 cgd m = n;
719 1.1 cgd n = n->m_next;
720 1.1 cgd len -= m->m_len;
721 1.1 cgd } else {
722 1.1 cgd if (len > MHLEN)
723 1.1 cgd goto bad;
724 1.1 cgd MGET(m, M_DONTWAIT, n->m_type);
725 1.1 cgd if (m == 0)
726 1.1 cgd goto bad;
727 1.1 cgd m->m_len = 0;
728 1.1 cgd if (n->m_flags & M_PKTHDR) {
729 1.1 cgd M_COPY_PKTHDR(m, n);
730 1.1 cgd n->m_flags &= ~M_PKTHDR;
731 1.1 cgd }
732 1.1 cgd }
733 1.1 cgd space = &m->m_dat[MLEN] - (m->m_data + m->m_len);
734 1.1 cgd do {
735 1.1 cgd count = min(min(max(len, max_protohdr), space), n->m_len);
736 1.30 perry memcpy(mtod(m, caddr_t) + m->m_len, mtod(n, caddr_t),
737 1.1 cgd (unsigned)count);
738 1.1 cgd len -= count;
739 1.1 cgd m->m_len += count;
740 1.1 cgd n->m_len -= count;
741 1.1 cgd space -= count;
742 1.1 cgd if (n->m_len)
743 1.1 cgd n->m_data += count;
744 1.1 cgd else
745 1.1 cgd n = m_free(n);
746 1.1 cgd } while (len > 0 && n);
747 1.1 cgd if (len > 0) {
748 1.1 cgd (void) m_free(m);
749 1.1 cgd goto bad;
750 1.1 cgd }
751 1.1 cgd m->m_next = n;
752 1.1 cgd return (m);
753 1.1 cgd bad:
754 1.1 cgd m_freem(n);
755 1.1 cgd MPFail++;
756 1.1 cgd return (0);
757 1.9 mycroft }
758 1.9 mycroft
759 1.9 mycroft /*
760 1.9 mycroft * Partition an mbuf chain in two pieces, returning the tail --
761 1.9 mycroft * all but the first len0 bytes. In case of failure, it returns NULL and
762 1.9 mycroft * attempts to restore the chain to its original state.
763 1.9 mycroft */
764 1.9 mycroft struct mbuf *
765 1.9 mycroft m_split(m0, len0, wait)
766 1.27 matt struct mbuf *m0;
767 1.9 mycroft int len0, wait;
768 1.9 mycroft {
769 1.27 matt struct mbuf *m, *n;
770 1.22 thorpej unsigned len = len0, remain, len_save;
771 1.9 mycroft
772 1.9 mycroft for (m = m0; m && len > m->m_len; m = m->m_next)
773 1.9 mycroft len -= m->m_len;
774 1.9 mycroft if (m == 0)
775 1.9 mycroft return (0);
776 1.9 mycroft remain = m->m_len - len;
777 1.9 mycroft if (m0->m_flags & M_PKTHDR) {
778 1.9 mycroft MGETHDR(n, wait, m0->m_type);
779 1.9 mycroft if (n == 0)
780 1.9 mycroft return (0);
781 1.9 mycroft n->m_pkthdr.rcvif = m0->m_pkthdr.rcvif;
782 1.9 mycroft n->m_pkthdr.len = m0->m_pkthdr.len - len0;
783 1.22 thorpej len_save = m0->m_pkthdr.len;
784 1.9 mycroft m0->m_pkthdr.len = len0;
785 1.9 mycroft if (m->m_flags & M_EXT)
786 1.9 mycroft goto extpacket;
787 1.9 mycroft if (remain > MHLEN) {
788 1.9 mycroft /* m can't be the lead packet */
789 1.9 mycroft MH_ALIGN(n, 0);
790 1.9 mycroft n->m_next = m_split(m, len, wait);
791 1.9 mycroft if (n->m_next == 0) {
792 1.9 mycroft (void) m_free(n);
793 1.22 thorpej m0->m_pkthdr.len = len_save;
794 1.9 mycroft return (0);
795 1.9 mycroft } else
796 1.9 mycroft return (n);
797 1.9 mycroft } else
798 1.9 mycroft MH_ALIGN(n, remain);
799 1.9 mycroft } else if (remain == 0) {
800 1.9 mycroft n = m->m_next;
801 1.9 mycroft m->m_next = 0;
802 1.9 mycroft return (n);
803 1.9 mycroft } else {
804 1.9 mycroft MGET(n, wait, m->m_type);
805 1.9 mycroft if (n == 0)
806 1.9 mycroft return (0);
807 1.9 mycroft M_ALIGN(n, remain);
808 1.9 mycroft }
809 1.9 mycroft extpacket:
810 1.9 mycroft if (m->m_flags & M_EXT) {
811 1.9 mycroft n->m_ext = m->m_ext;
812 1.18 thorpej MCLADDREFERENCE(m, n);
813 1.9 mycroft n->m_data = m->m_data + len;
814 1.9 mycroft } else {
815 1.30 perry memcpy(mtod(n, caddr_t), mtod(m, caddr_t) + len, remain);
816 1.9 mycroft }
817 1.9 mycroft n->m_len = remain;
818 1.9 mycroft m->m_len = len;
819 1.9 mycroft n->m_next = m->m_next;
820 1.9 mycroft m->m_next = 0;
821 1.9 mycroft return (n);
822 1.9 mycroft }
823 1.9 mycroft /*
824 1.9 mycroft * Routine to copy from device local memory into mbufs.
825 1.9 mycroft */
826 1.9 mycroft struct mbuf *
827 1.9 mycroft m_devget(buf, totlen, off0, ifp, copy)
828 1.9 mycroft char *buf;
829 1.9 mycroft int totlen, off0;
830 1.9 mycroft struct ifnet *ifp;
831 1.18 thorpej void (*copy) __P((const void *from, void *to, size_t len));
832 1.9 mycroft {
833 1.27 matt struct mbuf *m;
834 1.9 mycroft struct mbuf *top = 0, **mp = ⊤
835 1.27 matt int off = off0, len;
836 1.27 matt char *cp;
837 1.9 mycroft char *epkt;
838 1.9 mycroft
839 1.9 mycroft cp = buf;
840 1.9 mycroft epkt = cp + totlen;
841 1.9 mycroft if (off) {
842 1.13 cgd /*
843 1.13 cgd * If 'off' is non-zero, packet is trailer-encapsulated,
844 1.13 cgd * so we have to skip the type and length fields.
845 1.13 cgd */
846 1.13 cgd cp += off + 2 * sizeof(u_int16_t);
847 1.13 cgd totlen -= 2 * sizeof(u_int16_t);
848 1.9 mycroft }
849 1.9 mycroft MGETHDR(m, M_DONTWAIT, MT_DATA);
850 1.9 mycroft if (m == 0)
851 1.9 mycroft return (0);
852 1.9 mycroft m->m_pkthdr.rcvif = ifp;
853 1.9 mycroft m->m_pkthdr.len = totlen;
854 1.9 mycroft m->m_len = MHLEN;
855 1.9 mycroft
856 1.9 mycroft while (totlen > 0) {
857 1.9 mycroft if (top) {
858 1.9 mycroft MGET(m, M_DONTWAIT, MT_DATA);
859 1.9 mycroft if (m == 0) {
860 1.9 mycroft m_freem(top);
861 1.9 mycroft return (0);
862 1.9 mycroft }
863 1.9 mycroft m->m_len = MLEN;
864 1.9 mycroft }
865 1.9 mycroft len = min(totlen, epkt - cp);
866 1.9 mycroft if (len >= MINCLSIZE) {
867 1.9 mycroft MCLGET(m, M_DONTWAIT);
868 1.19 mycroft if ((m->m_flags & M_EXT) == 0) {
869 1.20 mycroft m_free(m);
870 1.19 mycroft m_freem(top);
871 1.19 mycroft return (0);
872 1.19 mycroft }
873 1.19 mycroft m->m_len = len = min(len, MCLBYTES);
874 1.9 mycroft } else {
875 1.9 mycroft /*
876 1.9 mycroft * Place initial small packet/header at end of mbuf.
877 1.9 mycroft */
878 1.9 mycroft if (len < m->m_len) {
879 1.9 mycroft if (top == 0 && len + max_linkhdr <= m->m_len)
880 1.9 mycroft m->m_data += max_linkhdr;
881 1.9 mycroft m->m_len = len;
882 1.9 mycroft } else
883 1.9 mycroft len = m->m_len;
884 1.9 mycroft }
885 1.9 mycroft if (copy)
886 1.14 christos copy(cp, mtod(m, caddr_t), (size_t)len);
887 1.9 mycroft else
888 1.30 perry memcpy(mtod(m, caddr_t), cp, (size_t)len);
889 1.9 mycroft cp += len;
890 1.9 mycroft *mp = m;
891 1.9 mycroft mp = &m->m_next;
892 1.9 mycroft totlen -= len;
893 1.9 mycroft if (cp == epkt)
894 1.9 mycroft cp = buf;
895 1.9 mycroft }
896 1.9 mycroft return (top);
897 1.18 thorpej }
898 1.18 thorpej
899 1.18 thorpej /*
900 1.18 thorpej * Copy data from a buffer back into the indicated mbuf chain,
901 1.18 thorpej * starting "off" bytes from the beginning, extending the mbuf
902 1.18 thorpej * chain if necessary.
903 1.18 thorpej */
904 1.18 thorpej void
905 1.18 thorpej m_copyback(m0, off, len, cp)
906 1.18 thorpej struct mbuf *m0;
907 1.27 matt int off;
908 1.27 matt int len;
909 1.18 thorpej caddr_t cp;
910 1.18 thorpej {
911 1.27 matt int mlen;
912 1.27 matt struct mbuf *m = m0, *n;
913 1.18 thorpej int totlen = 0;
914 1.18 thorpej
915 1.18 thorpej if (m0 == 0)
916 1.18 thorpej return;
917 1.18 thorpej while (off > (mlen = m->m_len)) {
918 1.18 thorpej off -= mlen;
919 1.18 thorpej totlen += mlen;
920 1.18 thorpej if (m->m_next == 0) {
921 1.18 thorpej n = m_getclr(M_DONTWAIT, m->m_type);
922 1.18 thorpej if (n == 0)
923 1.18 thorpej goto out;
924 1.18 thorpej n->m_len = min(MLEN, len + off);
925 1.18 thorpej m->m_next = n;
926 1.18 thorpej }
927 1.18 thorpej m = m->m_next;
928 1.18 thorpej }
929 1.18 thorpej while (len > 0) {
930 1.18 thorpej mlen = min (m->m_len - off, len);
931 1.30 perry memcpy(mtod(m, caddr_t) + off, cp, (unsigned)mlen);
932 1.18 thorpej cp += mlen;
933 1.18 thorpej len -= mlen;
934 1.18 thorpej mlen += off;
935 1.18 thorpej off = 0;
936 1.18 thorpej totlen += mlen;
937 1.18 thorpej if (len == 0)
938 1.18 thorpej break;
939 1.18 thorpej if (m->m_next == 0) {
940 1.18 thorpej n = m_get(M_DONTWAIT, m->m_type);
941 1.18 thorpej if (n == 0)
942 1.18 thorpej break;
943 1.18 thorpej n->m_len = min(MLEN, len);
944 1.18 thorpej m->m_next = n;
945 1.18 thorpej }
946 1.18 thorpej m = m->m_next;
947 1.18 thorpej }
948 1.18 thorpej out: if (((m = m0)->m_flags & M_PKTHDR) && (m->m_pkthdr.len < totlen))
949 1.18 thorpej m->m_pkthdr.len = totlen;
950 1.1 cgd }
951