1caf43b02SWarner Losh /*- 251369649SPedro F. Giffuni * SPDX-License-Identifier: BSD-3-Clause 351369649SPedro F. Giffuni * 482cd038dSYoshinobu Inoue * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project. 582cd038dSYoshinobu Inoue * All rights reserved. 682cd038dSYoshinobu Inoue * 782cd038dSYoshinobu Inoue * Redistribution and use in source and binary forms, with or without 882cd038dSYoshinobu Inoue * modification, are permitted provided that the following conditions 982cd038dSYoshinobu Inoue * are met: 1082cd038dSYoshinobu Inoue * 1. Redistributions of source code must retain the above copyright 1182cd038dSYoshinobu Inoue * notice, this list of conditions and the following disclaimer. 1282cd038dSYoshinobu Inoue * 2. Redistributions in binary form must reproduce the above copyright 1382cd038dSYoshinobu Inoue * notice, this list of conditions and the following disclaimer in the 1482cd038dSYoshinobu Inoue * documentation and/or other materials provided with the distribution. 1582cd038dSYoshinobu Inoue * 3. Neither the name of the project nor the names of its contributors 1682cd038dSYoshinobu Inoue * may be used to endorse or promote products derived from this software 1782cd038dSYoshinobu Inoue * without specific prior written permission. 1882cd038dSYoshinobu Inoue * 1982cd038dSYoshinobu Inoue * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND 2082cd038dSYoshinobu Inoue * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 2182cd038dSYoshinobu Inoue * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 2282cd038dSYoshinobu Inoue * ARE DISCLAIMED. IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE 2382cd038dSYoshinobu Inoue * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 2482cd038dSYoshinobu Inoue * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 2582cd038dSYoshinobu Inoue * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 2682cd038dSYoshinobu Inoue * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 2782cd038dSYoshinobu Inoue * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 2882cd038dSYoshinobu Inoue * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 2982cd038dSYoshinobu Inoue * SUCH DAMAGE. 30b48287a3SDavid E. O'Brien * 31b48287a3SDavid E. O'Brien * $KAME: frag6.c,v 1.33 2002/01/07 11:34:48 kjc Exp $ 3282cd038dSYoshinobu Inoue */ 3382cd038dSYoshinobu Inoue 34b48287a3SDavid E. O'Brien #include <sys/cdefs.h> 35b48287a3SDavid E. O'Brien __FBSDID("$FreeBSD$"); 36b48287a3SDavid E. O'Brien 37aaa46574SAdrian Chadd #include "opt_rss.h" 38aaa46574SAdrian Chadd 3982cd038dSYoshinobu Inoue #include <sys/param.h> 401a3044faSBjoern A. Zeeb #include <sys/domain.h> 411a3044faSBjoern A. Zeeb #include <sys/errno.h> 421a3044faSBjoern A. Zeeb #include <sys/eventhandler.h> 4380d7a853SJonathan T. Looney #include <sys/hash.h> 441a3044faSBjoern A. Zeeb #include <sys/kernel.h> 4582cd038dSYoshinobu Inoue #include <sys/malloc.h> 4682cd038dSYoshinobu Inoue #include <sys/mbuf.h> 4782cd038dSYoshinobu Inoue #include <sys/protosw.h> 4882cd038dSYoshinobu Inoue #include <sys/socket.h> 4982cd038dSYoshinobu Inoue #include <sys/time.h> 50757cb678SBjoern A. Zeeb #include <sys/sysctl.h> 5182cd038dSYoshinobu Inoue #include <sys/syslog.h> 5282cd038dSYoshinobu Inoue 5380d7a853SJonathan T. Looney #include <machine/atomic.h> 5480d7a853SJonathan T. Looney 5582cd038dSYoshinobu Inoue #include <net/if.h> 5676039bc8SGleb Smirnoff #include <net/if_var.h> 57aaa46574SAdrian Chadd #include <net/netisr.h> 5882cd038dSYoshinobu Inoue #include <net/route.h> 59eddfbb76SRobert Watson #include <net/vnet.h> 6082cd038dSYoshinobu Inoue 6182cd038dSYoshinobu Inoue #include <netinet/in.h> 6282cd038dSYoshinobu Inoue #include <netinet/in_var.h> 63686cdd19SJun-ichiro itojun Hagino #include <netinet/ip6.h> 6482cd038dSYoshinobu Inoue #include <netinet6/ip6_var.h> 65686cdd19SJun-ichiro itojun Hagino #include <netinet/icmp6.h> 6659dfcba4SHajimu UMEMOTO #include <netinet/in_systm.h> /* for ECN definitions */ 6759dfcba4SHajimu UMEMOTO #include <netinet/ip.h> /* for ECN definitions */ 6882cd038dSYoshinobu Inoue 691a3044faSBjoern A. Zeeb #ifdef MAC 704b908c8bSRobert Watson #include <security/mac/mac_framework.h> 711a3044faSBjoern A. Zeeb #endif 724b908c8bSRobert Watson 7331e8f7e5SHajimu UMEMOTO /* 7480d7a853SJonathan T. Looney * Reassembly headers are stored in hash buckets. 7531e8f7e5SHajimu UMEMOTO */ 762ceeacbeSJonathan T. Looney #define IP6REASS_NHASH_LOG2 10 7780d7a853SJonathan T. Looney #define IP6REASS_NHASH (1 << IP6REASS_NHASH_LOG2) 7880d7a853SJonathan T. Looney #define IP6REASS_HMASK (IP6REASS_NHASH - 1) 7980d7a853SJonathan T. Looney 8080d7a853SJonathan T. Looney static void frag6_enq(struct ip6asfrag *, struct ip6asfrag *, 8180d7a853SJonathan T. Looney uint32_t bucket __unused); 8280d7a853SJonathan T. Looney static void frag6_deq(struct ip6asfrag *, uint32_t bucket __unused); 8380d7a853SJonathan T. Looney static void frag6_insque_head(struct ip6q *, struct ip6q *, 841e9f3b73SJonathan T. Looney uint32_t bucket); 851e9f3b73SJonathan T. Looney static void frag6_remque(struct ip6q *, uint32_t bucket); 866bbdbbb8SHans Petter Selasky static void frag6_freef(struct ip6q *, uint32_t bucket); 8780d7a853SJonathan T. Looney 8880d7a853SJonathan T. Looney struct ip6qbucket { 8980d7a853SJonathan T. Looney struct ip6q ip6q; 9080d7a853SJonathan T. Looney struct mtx lock; 911e9f3b73SJonathan T. Looney int count; 9280d7a853SJonathan T. Looney }; 9380d7a853SJonathan T. Looney 94757cb678SBjoern A. Zeeb /* System wide (global) maximum and count of packets in reassembly queues. */ 95757cb678SBjoern A. Zeeb static int ip6_maxfrags; 96757cb678SBjoern A. Zeeb static volatile u_int frag6_nfrags = 0; 97757cb678SBjoern A. Zeeb 98757cb678SBjoern A. Zeeb /* Maximum and current packets in per-VNET reassembly queue. */ 99757cb678SBjoern A. Zeeb VNET_DEFINE_STATIC(int, ip6_maxfragpackets); 10080d7a853SJonathan T. Looney VNET_DEFINE_STATIC(volatile u_int, frag6_nfragpackets); 101757cb678SBjoern A. Zeeb #define V_ip6_maxfragpackets VNET(ip6_maxfragpackets) 102757cb678SBjoern A. Zeeb #define V_frag6_nfragpackets VNET(frag6_nfragpackets) 103757cb678SBjoern A. Zeeb 104757cb678SBjoern A. Zeeb /* Maximum per-VNET reassembly queues per bucket and fragments per packet. */ 105757cb678SBjoern A. Zeeb VNET_DEFINE_STATIC(int, ip6_maxfragbucketsize); 106757cb678SBjoern A. Zeeb VNET_DEFINE_STATIC(int, ip6_maxfragsperpacket); 107757cb678SBjoern A. Zeeb #define V_ip6_maxfragbucketsize VNET(ip6_maxfragbucketsize) 108757cb678SBjoern A. Zeeb #define V_ip6_maxfragsperpacket VNET(ip6_maxfragsperpacket) 109757cb678SBjoern A. Zeeb 110757cb678SBjoern A. Zeeb /* Per-VNET reassembly queue buckets. */ 11180d7a853SJonathan T. Looney VNET_DEFINE_STATIC(struct ip6qbucket, ip6q[IP6REASS_NHASH]); 11280d7a853SJonathan T. Looney VNET_DEFINE_STATIC(uint32_t, ip6q_hashseed); 1131e77c105SRobert Watson #define V_ip6q VNET(ip6q) 11480d7a853SJonathan T. Looney #define V_ip6q_hashseed VNET(ip6q_hashseed) 11582cd038dSYoshinobu Inoue 11680d7a853SJonathan T. Looney #define IP6Q_LOCK(i) mtx_lock(&V_ip6q[(i)].lock) 11780d7a853SJonathan T. Looney #define IP6Q_TRYLOCK(i) mtx_trylock(&V_ip6q[(i)].lock) 11880d7a853SJonathan T. Looney #define IP6Q_LOCK_ASSERT(i) mtx_assert(&V_ip6q[(i)].lock, MA_OWNED) 11980d7a853SJonathan T. Looney #define IP6Q_UNLOCK(i) mtx_unlock(&V_ip6q[(i)].lock) 12080d7a853SJonathan T. Looney #define IP6Q_HEAD(i) (&V_ip6q[(i)].ip6q) 1219888c401SHajimu UMEMOTO 122959b7375SPoul-Henning Kamp static MALLOC_DEFINE(M_FTABLE, "fragment", "fragment reassembly header"); 123686cdd19SJun-ichiro itojun Hagino 12482cd038dSYoshinobu Inoue /* 1252ceeacbeSJonathan T. Looney * By default, limit the number of IP6 fragments across all reassembly 1262ceeacbeSJonathan T. Looney * queues to 1/32 of the total number of mbuf clusters. 1272ceeacbeSJonathan T. Looney * 1282ceeacbeSJonathan T. Looney * Limit the total number of reassembly queues per VNET to the 1292ceeacbeSJonathan T. Looney * IP6 fragment limit, but ensure the limit will not allow any bucket 1302ceeacbeSJonathan T. Looney * to grow above 100 items. (The bucket limit is 1312ceeacbeSJonathan T. Looney * IP_MAXFRAGPACKETS / (IPREASS_NHASH / 2), so the 50 is the correct 1322ceeacbeSJonathan T. Looney * multiplier to reach a 100-item limit.) 1332ceeacbeSJonathan T. Looney * The 100-item limit was chosen as brief testing seems to show that 1342ceeacbeSJonathan T. Looney * this produces "reasonable" performance on some subset of systems 1352ceeacbeSJonathan T. Looney * under DoS attack. 1362ceeacbeSJonathan T. Looney */ 1372ceeacbeSJonathan T. Looney #define IP6_MAXFRAGS (nmbclusters / 32) 1382ceeacbeSJonathan T. Looney #define IP6_MAXFRAGPACKETS (imin(IP6_MAXFRAGS, IP6REASS_NHASH * 50)) 1392ceeacbeSJonathan T. Looney 140757cb678SBjoern A. Zeeb 1412ceeacbeSJonathan T. Looney /* 142757cb678SBjoern A. Zeeb * Sysctls and helper function. 14382cd038dSYoshinobu Inoue */ 144757cb678SBjoern A. Zeeb SYSCTL_DECL(_net_inet6_ip6); 145757cb678SBjoern A. Zeeb 146757cb678SBjoern A. Zeeb static void 1471e9f3b73SJonathan T. Looney frag6_set_bucketsize() 1481e9f3b73SJonathan T. Looney { 1491e9f3b73SJonathan T. Looney int i; 1501e9f3b73SJonathan T. Looney 1511e9f3b73SJonathan T. Looney if ((i = V_ip6_maxfragpackets) > 0) 1521e9f3b73SJonathan T. Looney V_ip6_maxfragbucketsize = imax(i / (IP6REASS_NHASH / 2), 1); 1531e9f3b73SJonathan T. Looney } 1541e9f3b73SJonathan T. Looney 155757cb678SBjoern A. Zeeb SYSCTL_INT(_net_inet6_ip6, IPV6CTL_MAXFRAGS, maxfrags, 156757cb678SBjoern A. Zeeb CTLFLAG_RW, &ip6_maxfrags, 0, 157757cb678SBjoern A. Zeeb "Maximum allowed number of outstanding IPv6 packet fragments. " 158757cb678SBjoern A. Zeeb "A value of 0 means no fragmented packets will be accepted, while a " 159757cb678SBjoern A. Zeeb "a value of -1 means no limit"); 160757cb678SBjoern A. Zeeb 161757cb678SBjoern A. Zeeb static int 162757cb678SBjoern A. Zeeb sysctl_ip6_maxfragpackets(SYSCTL_HANDLER_ARGS) 163757cb678SBjoern A. Zeeb { 164757cb678SBjoern A. Zeeb int error, val; 165757cb678SBjoern A. Zeeb 166757cb678SBjoern A. Zeeb val = V_ip6_maxfragpackets; 167757cb678SBjoern A. Zeeb error = sysctl_handle_int(oidp, &val, 0, req); 168757cb678SBjoern A. Zeeb if (error != 0 || !req->newptr) 169757cb678SBjoern A. Zeeb return (error); 170757cb678SBjoern A. Zeeb V_ip6_maxfragpackets = val; 171757cb678SBjoern A. Zeeb frag6_set_bucketsize(); 172757cb678SBjoern A. Zeeb return (0); 173757cb678SBjoern A. Zeeb } 174757cb678SBjoern A. Zeeb SYSCTL_PROC(_net_inet6_ip6, IPV6CTL_MAXFRAGPACKETS, maxfragpackets, 175757cb678SBjoern A. Zeeb CTLFLAG_VNET | CTLTYPE_INT | CTLFLAG_RW, NULL, 0, 176757cb678SBjoern A. Zeeb sysctl_ip6_maxfragpackets, "I", 177757cb678SBjoern A. Zeeb "Default maximum number of outstanding fragmented IPv6 packets. " 178757cb678SBjoern A. Zeeb "A value of 0 means no fragmented packets will be accepted, while a " 179757cb678SBjoern A. Zeeb "a value of -1 means no limit"); 180757cb678SBjoern A. Zeeb SYSCTL_INT(_net_inet6_ip6, IPV6CTL_MAXFRAGSPERPACKET, maxfragsperpacket, 181757cb678SBjoern A. Zeeb CTLFLAG_VNET | CTLFLAG_RW, &VNET_NAME(ip6_maxfragsperpacket), 0, 182757cb678SBjoern A. Zeeb "Maximum allowed number of fragments per packet"); 183757cb678SBjoern A. Zeeb SYSCTL_INT(_net_inet6_ip6, IPV6CTL_MAXFRAGBUCKETSIZE, maxfragbucketsize, 184757cb678SBjoern A. Zeeb CTLFLAG_VNET | CTLFLAG_RW, &VNET_NAME(ip6_maxfragbucketsize), 0, 185757cb678SBjoern A. Zeeb "Maximum number of reassembly queues per hash bucket"); 186757cb678SBjoern A. Zeeb 187757cb678SBjoern A. Zeeb 188757cb678SBjoern A. Zeeb /* 189757cb678SBjoern A. Zeeb * Initialise reassembly queue and fragment identifier. 190757cb678SBjoern A. Zeeb */ 1914f590175SPaul Saab static void 1924f590175SPaul Saab frag6_change(void *tag) 1934f590175SPaul Saab { 1942adfd64fSJonathan T. Looney VNET_ITERATOR_DECL(vnet_iter); 1954f590175SPaul Saab 1962ceeacbeSJonathan T. Looney ip6_maxfrags = IP6_MAXFRAGS; 1972adfd64fSJonathan T. Looney VNET_LIST_RLOCK_NOSLEEP(); 1982adfd64fSJonathan T. Looney VNET_FOREACH(vnet_iter) { 1992adfd64fSJonathan T. Looney CURVNET_SET(vnet_iter); 2002ceeacbeSJonathan T. Looney V_ip6_maxfragpackets = IP6_MAXFRAGPACKETS; 2011e9f3b73SJonathan T. Looney frag6_set_bucketsize(); 2022adfd64fSJonathan T. Looney CURVNET_RESTORE(); 2032adfd64fSJonathan T. Looney } 2042adfd64fSJonathan T. Looney VNET_LIST_RUNLOCK_NOSLEEP(); 2054f590175SPaul Saab } 2064f590175SPaul Saab 20782cd038dSYoshinobu Inoue void 2081272577eSXin LI frag6_init(void) 20982cd038dSYoshinobu Inoue { 21080d7a853SJonathan T. Looney struct ip6q *q6; 21180d7a853SJonathan T. Looney int i; 21282cd038dSYoshinobu Inoue 2132ceeacbeSJonathan T. Looney V_ip6_maxfragpackets = IP6_MAXFRAGPACKETS; 2141e9f3b73SJonathan T. Looney frag6_set_bucketsize(); 21580d7a853SJonathan T. Looney for (i = 0; i < IP6REASS_NHASH; i++) { 21680d7a853SJonathan T. Looney q6 = IP6Q_HEAD(i); 21780d7a853SJonathan T. Looney q6->ip6q_next = q6->ip6q_prev = q6; 21880d7a853SJonathan T. Looney mtx_init(&V_ip6q[i].lock, "ip6qlock", NULL, MTX_DEF); 2191e9f3b73SJonathan T. Looney V_ip6q[i].count = 0; 22080d7a853SJonathan T. Looney } 22180d7a853SJonathan T. Looney V_ip6q_hashseed = arc4random(); 22203c99d76SJonathan T. Looney V_ip6_maxfragsperpacket = 64; 2231ed81b73SMarko Zec if (!IS_DEFAULT_VNET(curvnet)) 2241ed81b73SMarko Zec return; 22596c2b042SJesper Skriver 2262ceeacbeSJonathan T. Looney ip6_maxfrags = IP6_MAXFRAGS; 2271ed81b73SMarko Zec EVENTHANDLER_REGISTER(nmbclusters_change, 2281ed81b73SMarko Zec frag6_change, NULL, EVENTHANDLER_PRI_ANY); 22982cd038dSYoshinobu Inoue } 23082cd038dSYoshinobu Inoue 23182cd038dSYoshinobu Inoue /* 232686cdd19SJun-ichiro itojun Hagino * In RFC2460, fragment and reassembly rule do not agree with each other, 233686cdd19SJun-ichiro itojun Hagino * in terms of next header field handling in fragment header. 234686cdd19SJun-ichiro itojun Hagino * While the sender will use the same value for all of the fragmented packets, 235686cdd19SJun-ichiro itojun Hagino * receiver is suggested not to check the consistency. 236686cdd19SJun-ichiro itojun Hagino * 237686cdd19SJun-ichiro itojun Hagino * fragment rule (p20): 238686cdd19SJun-ichiro itojun Hagino * (2) A Fragment header containing: 239686cdd19SJun-ichiro itojun Hagino * The Next Header value that identifies the first header of 240686cdd19SJun-ichiro itojun Hagino * the Fragmentable Part of the original packet. 241686cdd19SJun-ichiro itojun Hagino * -> next header field is same for all fragments 242686cdd19SJun-ichiro itojun Hagino * 243686cdd19SJun-ichiro itojun Hagino * reassembly rule (p21): 244686cdd19SJun-ichiro itojun Hagino * The Next Header field of the last header of the Unfragmentable 245686cdd19SJun-ichiro itojun Hagino * Part is obtained from the Next Header field of the first 246686cdd19SJun-ichiro itojun Hagino * fragment's Fragment header. 247686cdd19SJun-ichiro itojun Hagino * -> should grab it from the first fragment only 248686cdd19SJun-ichiro itojun Hagino * 249686cdd19SJun-ichiro itojun Hagino * The following note also contradicts with fragment rule - no one is going to 250686cdd19SJun-ichiro itojun Hagino * send different fragment with different next header field. 251686cdd19SJun-ichiro itojun Hagino * 252686cdd19SJun-ichiro itojun Hagino * additional note (p22): 253686cdd19SJun-ichiro itojun Hagino * The Next Header values in the Fragment headers of different 254686cdd19SJun-ichiro itojun Hagino * fragments of the same original packet may differ. Only the value 255686cdd19SJun-ichiro itojun Hagino * from the Offset zero fragment packet is used for reassembly. 256686cdd19SJun-ichiro itojun Hagino * -> should grab it from the first fragment only 257686cdd19SJun-ichiro itojun Hagino * 258686cdd19SJun-ichiro itojun Hagino * There is no explicit reason given in the RFC. Historical reason maybe? 259686cdd19SJun-ichiro itojun Hagino */ 260686cdd19SJun-ichiro itojun Hagino /* 26182cd038dSYoshinobu Inoue * Fragment input 26282cd038dSYoshinobu Inoue */ 26382cd038dSYoshinobu Inoue int 2641272577eSXin LI frag6_input(struct mbuf **mp, int *offp, int proto) 26582cd038dSYoshinobu Inoue { 26682cd038dSYoshinobu Inoue struct mbuf *m = *mp, *t; 26782cd038dSYoshinobu Inoue struct ip6_hdr *ip6; 26882cd038dSYoshinobu Inoue struct ip6_frag *ip6f; 26980d7a853SJonathan T. Looney struct ip6q *head, *q6; 270686cdd19SJun-ichiro itojun Hagino struct ip6asfrag *af6, *ip6af, *af6dwn; 2712a5aafceSHajimu UMEMOTO struct in6_ifaddr *ia; 27282cd038dSYoshinobu Inoue int offset = *offp, nxt, i, next; 27382cd038dSYoshinobu Inoue int first_frag = 0; 274686cdd19SJun-ichiro itojun Hagino int fragoff, frgpartlen; /* must be larger than u_int16_t */ 275505e91f5SKristof Provost uint32_t hashkey[(sizeof(struct in6_addr) * 2 + 276505e91f5SKristof Provost sizeof(ip6f->ip6f_ident)) / sizeof(uint32_t)]; 277505e91f5SKristof Provost uint32_t hash, *hashkeyp; 27882cd038dSYoshinobu Inoue struct ifnet *dstifp; 27959dfcba4SHajimu UMEMOTO u_int8_t ecn, ecn0; 280aaa46574SAdrian Chadd #ifdef RSS 281aaa46574SAdrian Chadd struct m_tag *mtag; 282aaa46574SAdrian Chadd struct ip6_direct_ctx *ip6dc; 283aaa46574SAdrian Chadd #endif 284aaa46574SAdrian Chadd 2851d54aa3bSBjoern A. Zeeb #if 0 2861d54aa3bSBjoern A. Zeeb char ip6buf[INET6_ADDRSTRLEN]; 2871d54aa3bSBjoern A. Zeeb #endif 28882cd038dSYoshinobu Inoue 28982cd038dSYoshinobu Inoue ip6 = mtod(m, struct ip6_hdr *); 290686cdd19SJun-ichiro itojun Hagino #ifndef PULLDOWN_TEST 291686cdd19SJun-ichiro itojun Hagino IP6_EXTHDR_CHECK(m, offset, sizeof(struct ip6_frag), IPPROTO_DONE); 29282cd038dSYoshinobu Inoue ip6f = (struct ip6_frag *)((caddr_t)ip6 + offset); 293686cdd19SJun-ichiro itojun Hagino #else 294686cdd19SJun-ichiro itojun Hagino IP6_EXTHDR_GET(ip6f, struct ip6_frag *, m, offset, sizeof(*ip6f)); 295686cdd19SJun-ichiro itojun Hagino if (ip6f == NULL) 29640e39bbbSHajimu UMEMOTO return (IPPROTO_DONE); 297686cdd19SJun-ichiro itojun Hagino #endif 29882cd038dSYoshinobu Inoue 29982cd038dSYoshinobu Inoue dstifp = NULL; 30082cd038dSYoshinobu Inoue /* find the destination interface of the packet. */ 3013e88eb90SAndrey V. Elsukov ia = in6ifa_ifwithaddr(&ip6->ip6_dst, 0 /* XXX */); 3023e88eb90SAndrey V. Elsukov if (ia != NULL) { 3032a5aafceSHajimu UMEMOTO dstifp = ia->ia_ifp; 3048c0fec80SRobert Watson ifa_free(&ia->ia_ifa); 3058c0fec80SRobert Watson } 30682cd038dSYoshinobu Inoue /* jumbo payload can't contain a fragment header */ 30782cd038dSYoshinobu Inoue if (ip6->ip6_plen == 0) { 30882cd038dSYoshinobu Inoue icmp6_error(m, ICMP6_PARAM_PROB, ICMP6_PARAMPROB_HEADER, offset); 30982cd038dSYoshinobu Inoue in6_ifstat_inc(dstifp, ifs6_reass_fail); 31082cd038dSYoshinobu Inoue return IPPROTO_DONE; 31182cd038dSYoshinobu Inoue } 31282cd038dSYoshinobu Inoue 31382cd038dSYoshinobu Inoue /* 31482cd038dSYoshinobu Inoue * check whether fragment packet's fragment length is 31582cd038dSYoshinobu Inoue * multiple of 8 octets. 31682cd038dSYoshinobu Inoue * sizeof(struct ip6_frag) == 8 31782cd038dSYoshinobu Inoue * sizeof(struct ip6_hdr) = 40 31882cd038dSYoshinobu Inoue */ 31982cd038dSYoshinobu Inoue if ((ip6f->ip6f_offlg & IP6F_MORE_FRAG) && 32082cd038dSYoshinobu Inoue (((ntohs(ip6->ip6_plen) - offset) & 0x7) != 0)) { 32106cd0a3fSHajimu UMEMOTO icmp6_error(m, ICMP6_PARAM_PROB, ICMP6_PARAMPROB_HEADER, 322686cdd19SJun-ichiro itojun Hagino offsetof(struct ip6_hdr, ip6_plen)); 32382cd038dSYoshinobu Inoue in6_ifstat_inc(dstifp, ifs6_reass_fail); 32482cd038dSYoshinobu Inoue return IPPROTO_DONE; 32582cd038dSYoshinobu Inoue } 32682cd038dSYoshinobu Inoue 3279cb8d207SAndrey V. Elsukov IP6STAT_INC(ip6s_fragments); 32882cd038dSYoshinobu Inoue in6_ifstat_inc(dstifp, ifs6_reass_reqd); 32982cd038dSYoshinobu Inoue 330686cdd19SJun-ichiro itojun Hagino /* offset now points to data portion */ 33182cd038dSYoshinobu Inoue offset += sizeof(struct ip6_frag); 33282cd038dSYoshinobu Inoue 3334018ea9aSBjoern A. Zeeb /* 3342946a941STom Jones * Handle "atomic" fragments (offset and m bit set to 0) upfront, 3352946a941STom Jones * unrelated to any reassembly (see RFC 6946 and section 4.5 of RFC 3362946a941STom Jones * 8200). Just skip the fragment header. 3374018ea9aSBjoern A. Zeeb */ 3384018ea9aSBjoern A. Zeeb if ((ip6f->ip6f_offlg & ~IP6F_RESERVED_MASK) == 0) { 3392946a941STom Jones IP6STAT_INC(ip6s_atomicfrags); 3404018ea9aSBjoern A. Zeeb in6_ifstat_inc(dstifp, ifs6_reass_ok); 3414018ea9aSBjoern A. Zeeb *offp = offset; 342a4061289SAndrey V. Elsukov m->m_flags |= M_FRAGMENTED; 3434018ea9aSBjoern A. Zeeb return (ip6f->ip6f_nxt); 3444018ea9aSBjoern A. Zeeb } 3454018ea9aSBjoern A. Zeeb 3465f9f192dSJonathan T. Looney /* Get fragment length and discard 0-byte fragments. */ 3475f9f192dSJonathan T. Looney frgpartlen = sizeof(struct ip6_hdr) + ntohs(ip6->ip6_plen) - offset; 3485f9f192dSJonathan T. Looney if (frgpartlen == 0) { 3495f9f192dSJonathan T. Looney icmp6_error(m, ICMP6_PARAM_PROB, ICMP6_PARAMPROB_HEADER, 3505f9f192dSJonathan T. Looney offsetof(struct ip6_hdr, ip6_plen)); 3515f9f192dSJonathan T. Looney in6_ifstat_inc(dstifp, ifs6_reass_fail); 3525f9f192dSJonathan T. Looney IP6STAT_INC(ip6s_fragdropped); 3535f9f192dSJonathan T. Looney return IPPROTO_DONE; 3545f9f192dSJonathan T. Looney } 3555f9f192dSJonathan T. Looney 35680d7a853SJonathan T. Looney hashkeyp = hashkey; 35780d7a853SJonathan T. Looney memcpy(hashkeyp, &ip6->ip6_src, sizeof(struct in6_addr)); 35880d7a853SJonathan T. Looney hashkeyp += sizeof(struct in6_addr) / sizeof(*hashkeyp); 35980d7a853SJonathan T. Looney memcpy(hashkeyp, &ip6->ip6_dst, sizeof(struct in6_addr)); 36080d7a853SJonathan T. Looney hashkeyp += sizeof(struct in6_addr) / sizeof(*hashkeyp); 36180d7a853SJonathan T. Looney *hashkeyp = ip6f->ip6f_ident; 36280d7a853SJonathan T. Looney hash = jenkins_hash32(hashkey, nitems(hashkey), V_ip6q_hashseed); 36380d7a853SJonathan T. Looney hash &= IP6REASS_HMASK; 36480d7a853SJonathan T. Looney head = IP6Q_HEAD(hash); 36580d7a853SJonathan T. Looney IP6Q_LOCK(hash); 3669888c401SHajimu UMEMOTO 3679888c401SHajimu UMEMOTO /* 3689888c401SHajimu UMEMOTO * Enforce upper bound on number of fragments. 3699888c401SHajimu UMEMOTO * If maxfrag is 0, never accept fragments. 3709888c401SHajimu UMEMOTO * If maxfrag is -1, accept all fragments without limitation. 3719888c401SHajimu UMEMOTO */ 3722adfd64fSJonathan T. Looney if (ip6_maxfrags < 0) 3739888c401SHajimu UMEMOTO ; 3742adfd64fSJonathan T. Looney else if (atomic_load_int(&frag6_nfrags) >= (u_int)ip6_maxfrags) 3759888c401SHajimu UMEMOTO goto dropfrag; 37633841545SHajimu UMEMOTO 37780d7a853SJonathan T. Looney for (q6 = head->ip6q_next; q6 != head; q6 = q6->ip6q_next) 37882cd038dSYoshinobu Inoue if (ip6f->ip6f_ident == q6->ip6q_ident && 37982cd038dSYoshinobu Inoue IN6_ARE_ADDR_EQUAL(&ip6->ip6_src, &q6->ip6q_src) && 3804b908c8bSRobert Watson IN6_ARE_ADDR_EQUAL(&ip6->ip6_dst, &q6->ip6q_dst) 3814b908c8bSRobert Watson #ifdef MAC 3824b908c8bSRobert Watson && mac_ip6q_match(m, q6) 3834b908c8bSRobert Watson #endif 3844b908c8bSRobert Watson ) 38582cd038dSYoshinobu Inoue break; 38682cd038dSYoshinobu Inoue 38780d7a853SJonathan T. Looney if (q6 == head) { 38882cd038dSYoshinobu Inoue /* 38982cd038dSYoshinobu Inoue * the first fragment to arrive, create a reassembly queue. 39082cd038dSYoshinobu Inoue */ 39182cd038dSYoshinobu Inoue first_frag = 1; 39282cd038dSYoshinobu Inoue 39382cd038dSYoshinobu Inoue /* 39482cd038dSYoshinobu Inoue * Enforce upper bound on number of fragmented packets 39582cd038dSYoshinobu Inoue * for which we attempt reassembly; 3969888c401SHajimu UMEMOTO * If maxfragpackets is 0, never accept fragments. 3979888c401SHajimu UMEMOTO * If maxfragpackets is -1, accept all fragments without 3989888c401SHajimu UMEMOTO * limitation. 39982cd038dSYoshinobu Inoue */ 400603724d3SBjoern A. Zeeb if (V_ip6_maxfragpackets < 0) 40133841545SHajimu UMEMOTO ; 4021e9f3b73SJonathan T. Looney else if (V_ip6q[hash].count >= V_ip6_maxfragbucketsize || 4031e9f3b73SJonathan T. Looney atomic_load_int(&V_frag6_nfragpackets) >= 40480d7a853SJonathan T. Looney (u_int)V_ip6_maxfragpackets) 40533841545SHajimu UMEMOTO goto dropfrag; 40680d7a853SJonathan T. Looney atomic_add_int(&V_frag6_nfragpackets, 1); 40782cd038dSYoshinobu Inoue q6 = (struct ip6q *)malloc(sizeof(struct ip6q), M_FTABLE, 4088c0dd0e4SHajimu UMEMOTO M_NOWAIT); 40982cd038dSYoshinobu Inoue if (q6 == NULL) 41082cd038dSYoshinobu Inoue goto dropfrag; 411686cdd19SJun-ichiro itojun Hagino bzero(q6, sizeof(*q6)); 4124b908c8bSRobert Watson #ifdef MAC 4134b908c8bSRobert Watson if (mac_ip6q_init(q6, M_NOWAIT) != 0) { 4144b908c8bSRobert Watson free(q6, M_FTABLE); 4154b908c8bSRobert Watson goto dropfrag; 4164b908c8bSRobert Watson } 4174b908c8bSRobert Watson mac_ip6q_create(m, q6); 4184b908c8bSRobert Watson #endif 41980d7a853SJonathan T. Looney frag6_insque_head(q6, head, hash); 42082cd038dSYoshinobu Inoue 421686cdd19SJun-ichiro itojun Hagino /* ip6q_nxt will be filled afterwards, from 1st fragment */ 42282cd038dSYoshinobu Inoue q6->ip6q_down = q6->ip6q_up = (struct ip6asfrag *)q6; 423686cdd19SJun-ichiro itojun Hagino #ifdef notyet 424686cdd19SJun-ichiro itojun Hagino q6->ip6q_nxtp = (u_char *)nxtp; 425686cdd19SJun-ichiro itojun Hagino #endif 42682cd038dSYoshinobu Inoue q6->ip6q_ident = ip6f->ip6f_ident; 42782cd038dSYoshinobu Inoue q6->ip6q_ttl = IPV6_FRAGTTL; 42882cd038dSYoshinobu Inoue q6->ip6q_src = ip6->ip6_src; 42982cd038dSYoshinobu Inoue q6->ip6q_dst = ip6->ip6_dst; 4305e9510e3SJINMEI Tatuya q6->ip6q_ecn = 4315e9510e3SJINMEI Tatuya (ntohl(ip6->ip6_flow) >> 20) & IPTOS_ECN_MASK; 43282cd038dSYoshinobu Inoue q6->ip6q_unfrglen = -1; /* The 1st fragment has not arrived. */ 4339888c401SHajimu UMEMOTO 4349888c401SHajimu UMEMOTO q6->ip6q_nfrag = 0; 43582cd038dSYoshinobu Inoue } 43682cd038dSYoshinobu Inoue 43782cd038dSYoshinobu Inoue /* 43882cd038dSYoshinobu Inoue * If it's the 1st fragment, record the length of the 43982cd038dSYoshinobu Inoue * unfragmentable part and the next header of the fragment header. 44082cd038dSYoshinobu Inoue */ 44182cd038dSYoshinobu Inoue fragoff = ntohs(ip6f->ip6f_offlg & IP6F_OFF_MASK); 44282cd038dSYoshinobu Inoue if (fragoff == 0) { 44306cd0a3fSHajimu UMEMOTO q6->ip6q_unfrglen = offset - sizeof(struct ip6_hdr) - 44406cd0a3fSHajimu UMEMOTO sizeof(struct ip6_frag); 44582cd038dSYoshinobu Inoue q6->ip6q_nxt = ip6f->ip6f_nxt; 44682cd038dSYoshinobu Inoue } 44782cd038dSYoshinobu Inoue 44882cd038dSYoshinobu Inoue /* 44982cd038dSYoshinobu Inoue * Check that the reassembled packet would not exceed 65535 bytes 45082cd038dSYoshinobu Inoue * in size. 45182cd038dSYoshinobu Inoue * If it would exceed, discard the fragment and return an ICMP error. 45282cd038dSYoshinobu Inoue */ 45382cd038dSYoshinobu Inoue if (q6->ip6q_unfrglen >= 0) { 45482cd038dSYoshinobu Inoue /* The 1st fragment has already arrived. */ 45582cd038dSYoshinobu Inoue if (q6->ip6q_unfrglen + fragoff + frgpartlen > IPV6_MAXPACKET) { 45682cd038dSYoshinobu Inoue icmp6_error(m, ICMP6_PARAM_PROB, ICMP6_PARAMPROB_HEADER, 457686cdd19SJun-ichiro itojun Hagino offset - sizeof(struct ip6_frag) + 458686cdd19SJun-ichiro itojun Hagino offsetof(struct ip6_frag, ip6f_offlg)); 45980d7a853SJonathan T. Looney IP6Q_UNLOCK(hash); 46082cd038dSYoshinobu Inoue return (IPPROTO_DONE); 46182cd038dSYoshinobu Inoue } 46206cd0a3fSHajimu UMEMOTO } else if (fragoff + frgpartlen > IPV6_MAXPACKET) { 46382cd038dSYoshinobu Inoue icmp6_error(m, ICMP6_PARAM_PROB, ICMP6_PARAMPROB_HEADER, 464686cdd19SJun-ichiro itojun Hagino offset - sizeof(struct ip6_frag) + 465686cdd19SJun-ichiro itojun Hagino offsetof(struct ip6_frag, ip6f_offlg)); 46680d7a853SJonathan T. Looney IP6Q_UNLOCK(hash); 46782cd038dSYoshinobu Inoue return (IPPROTO_DONE); 46882cd038dSYoshinobu Inoue } 46982cd038dSYoshinobu Inoue /* 47082cd038dSYoshinobu Inoue * If it's the first fragment, do the above check for each 47182cd038dSYoshinobu Inoue * fragment already stored in the reassembly queue. 47282cd038dSYoshinobu Inoue */ 47382cd038dSYoshinobu Inoue if (fragoff == 0) { 47482cd038dSYoshinobu Inoue for (af6 = q6->ip6q_down; af6 != (struct ip6asfrag *)q6; 47582cd038dSYoshinobu Inoue af6 = af6dwn) { 47682cd038dSYoshinobu Inoue af6dwn = af6->ip6af_down; 47782cd038dSYoshinobu Inoue 47882cd038dSYoshinobu Inoue if (q6->ip6q_unfrglen + af6->ip6af_off + af6->ip6af_frglen > 47982cd038dSYoshinobu Inoue IPV6_MAXPACKET) { 48082cd038dSYoshinobu Inoue struct mbuf *merr = IP6_REASS_MBUF(af6); 48182cd038dSYoshinobu Inoue struct ip6_hdr *ip6err; 48282cd038dSYoshinobu Inoue int erroff = af6->ip6af_offset; 48382cd038dSYoshinobu Inoue 48482cd038dSYoshinobu Inoue /* dequeue the fragment. */ 48580d7a853SJonathan T. Looney frag6_deq(af6, hash); 486686cdd19SJun-ichiro itojun Hagino free(af6, M_FTABLE); 48782cd038dSYoshinobu Inoue 48882cd038dSYoshinobu Inoue /* adjust pointer. */ 48982cd038dSYoshinobu Inoue ip6err = mtod(merr, struct ip6_hdr *); 49082cd038dSYoshinobu Inoue 49182cd038dSYoshinobu Inoue /* 49282cd038dSYoshinobu Inoue * Restore source and destination addresses 49382cd038dSYoshinobu Inoue * in the erroneous IPv6 header. 49482cd038dSYoshinobu Inoue */ 49582cd038dSYoshinobu Inoue ip6err->ip6_src = q6->ip6q_src; 49682cd038dSYoshinobu Inoue ip6err->ip6_dst = q6->ip6q_dst; 49782cd038dSYoshinobu Inoue 49882cd038dSYoshinobu Inoue icmp6_error(merr, ICMP6_PARAM_PROB, 49982cd038dSYoshinobu Inoue ICMP6_PARAMPROB_HEADER, 500686cdd19SJun-ichiro itojun Hagino erroff - sizeof(struct ip6_frag) + 501686cdd19SJun-ichiro itojun Hagino offsetof(struct ip6_frag, ip6f_offlg)); 50282cd038dSYoshinobu Inoue } 50382cd038dSYoshinobu Inoue } 50482cd038dSYoshinobu Inoue } 50582cd038dSYoshinobu Inoue 506686cdd19SJun-ichiro itojun Hagino ip6af = (struct ip6asfrag *)malloc(sizeof(struct ip6asfrag), M_FTABLE, 5078c0dd0e4SHajimu UMEMOTO M_NOWAIT); 508686cdd19SJun-ichiro itojun Hagino if (ip6af == NULL) 509686cdd19SJun-ichiro itojun Hagino goto dropfrag; 510686cdd19SJun-ichiro itojun Hagino bzero(ip6af, sizeof(*ip6af)); 51182cd038dSYoshinobu Inoue ip6af->ip6af_mff = ip6f->ip6f_offlg & IP6F_MORE_FRAG; 51282cd038dSYoshinobu Inoue ip6af->ip6af_off = fragoff; 51382cd038dSYoshinobu Inoue ip6af->ip6af_frglen = frgpartlen; 51482cd038dSYoshinobu Inoue ip6af->ip6af_offset = offset; 51582cd038dSYoshinobu Inoue IP6_REASS_MBUF(ip6af) = m; 51682cd038dSYoshinobu Inoue 51782cd038dSYoshinobu Inoue if (first_frag) { 51882cd038dSYoshinobu Inoue af6 = (struct ip6asfrag *)q6; 51982cd038dSYoshinobu Inoue goto insert; 52082cd038dSYoshinobu Inoue } 52182cd038dSYoshinobu Inoue 52282cd038dSYoshinobu Inoue /* 52359dfcba4SHajimu UMEMOTO * Handle ECN by comparing this segment with the first one; 52459dfcba4SHajimu UMEMOTO * if CE is set, do not lose CE. 52559dfcba4SHajimu UMEMOTO * drop if CE and not-ECT are mixed for the same packet. 52659dfcba4SHajimu UMEMOTO */ 52759dfcba4SHajimu UMEMOTO ecn = (ntohl(ip6->ip6_flow) >> 20) & IPTOS_ECN_MASK; 5285e9510e3SJINMEI Tatuya ecn0 = q6->ip6q_ecn; 52959dfcba4SHajimu UMEMOTO if (ecn == IPTOS_ECN_CE) { 53059dfcba4SHajimu UMEMOTO if (ecn0 == IPTOS_ECN_NOTECT) { 53159dfcba4SHajimu UMEMOTO free(ip6af, M_FTABLE); 53259dfcba4SHajimu UMEMOTO goto dropfrag; 53359dfcba4SHajimu UMEMOTO } 53459dfcba4SHajimu UMEMOTO if (ecn0 != IPTOS_ECN_CE) 5355e9510e3SJINMEI Tatuya q6->ip6q_ecn = IPTOS_ECN_CE; 53659dfcba4SHajimu UMEMOTO } 53759dfcba4SHajimu UMEMOTO if (ecn == IPTOS_ECN_NOTECT && ecn0 != IPTOS_ECN_NOTECT) { 53859dfcba4SHajimu UMEMOTO free(ip6af, M_FTABLE); 53959dfcba4SHajimu UMEMOTO goto dropfrag; 54059dfcba4SHajimu UMEMOTO } 54159dfcba4SHajimu UMEMOTO 54259dfcba4SHajimu UMEMOTO /* 54382cd038dSYoshinobu Inoue * Find a segment which begins after this one does. 54482cd038dSYoshinobu Inoue */ 54582cd038dSYoshinobu Inoue for (af6 = q6->ip6q_down; af6 != (struct ip6asfrag *)q6; 54682cd038dSYoshinobu Inoue af6 = af6->ip6af_down) 54782cd038dSYoshinobu Inoue if (af6->ip6af_off > ip6af->ip6af_off) 54882cd038dSYoshinobu Inoue break; 54982cd038dSYoshinobu Inoue 550686cdd19SJun-ichiro itojun Hagino #if 0 551686cdd19SJun-ichiro itojun Hagino /* 552686cdd19SJun-ichiro itojun Hagino * If there is a preceding segment, it may provide some of 553686cdd19SJun-ichiro itojun Hagino * our data already. If so, drop the data from the incoming 554686cdd19SJun-ichiro itojun Hagino * segment. If it provides all of our data, drop us. 555686cdd19SJun-ichiro itojun Hagino */ 556686cdd19SJun-ichiro itojun Hagino if (af6->ip6af_up != (struct ip6asfrag *)q6) { 557686cdd19SJun-ichiro itojun Hagino i = af6->ip6af_up->ip6af_off + af6->ip6af_up->ip6af_frglen 558686cdd19SJun-ichiro itojun Hagino - ip6af->ip6af_off; 559686cdd19SJun-ichiro itojun Hagino if (i > 0) { 560686cdd19SJun-ichiro itojun Hagino if (i >= ip6af->ip6af_frglen) 561686cdd19SJun-ichiro itojun Hagino goto dropfrag; 562686cdd19SJun-ichiro itojun Hagino m_adj(IP6_REASS_MBUF(ip6af), i); 563686cdd19SJun-ichiro itojun Hagino ip6af->ip6af_off += i; 564686cdd19SJun-ichiro itojun Hagino ip6af->ip6af_frglen -= i; 565686cdd19SJun-ichiro itojun Hagino } 566686cdd19SJun-ichiro itojun Hagino } 567686cdd19SJun-ichiro itojun Hagino 568686cdd19SJun-ichiro itojun Hagino /* 569686cdd19SJun-ichiro itojun Hagino * While we overlap succeeding segments trim them or, 570686cdd19SJun-ichiro itojun Hagino * if they are completely covered, dequeue them. 571686cdd19SJun-ichiro itojun Hagino */ 572686cdd19SJun-ichiro itojun Hagino while (af6 != (struct ip6asfrag *)q6 && 573686cdd19SJun-ichiro itojun Hagino ip6af->ip6af_off + ip6af->ip6af_frglen > af6->ip6af_off) { 574686cdd19SJun-ichiro itojun Hagino i = (ip6af->ip6af_off + ip6af->ip6af_frglen) - af6->ip6af_off; 575686cdd19SJun-ichiro itojun Hagino if (i < af6->ip6af_frglen) { 576686cdd19SJun-ichiro itojun Hagino af6->ip6af_frglen -= i; 577686cdd19SJun-ichiro itojun Hagino af6->ip6af_off += i; 578686cdd19SJun-ichiro itojun Hagino m_adj(IP6_REASS_MBUF(af6), i); 579686cdd19SJun-ichiro itojun Hagino break; 580686cdd19SJun-ichiro itojun Hagino } 581686cdd19SJun-ichiro itojun Hagino af6 = af6->ip6af_down; 582686cdd19SJun-ichiro itojun Hagino m_freem(IP6_REASS_MBUF(af6->ip6af_up)); 58380d7a853SJonathan T. Looney frag6_deq(af6->ip6af_up, hash); 584686cdd19SJun-ichiro itojun Hagino } 585686cdd19SJun-ichiro itojun Hagino #else 58682cd038dSYoshinobu Inoue /* 58782cd038dSYoshinobu Inoue * If the incoming framgent overlaps some existing fragments in 58882cd038dSYoshinobu Inoue * the reassembly queue, drop it, since it is dangerous to override 58982cd038dSYoshinobu Inoue * existing fragments from a security point of view. 5909888c401SHajimu UMEMOTO * We don't know which fragment is the bad guy - here we trust 5919888c401SHajimu UMEMOTO * fragment that came in earlier, with no real reason. 5925e9510e3SJINMEI Tatuya * 5935e9510e3SJINMEI Tatuya * Note: due to changes after disabling this part, mbuf passed to 5945e9510e3SJINMEI Tatuya * m_adj() below now does not meet the requirement. 59582cd038dSYoshinobu Inoue */ 59682cd038dSYoshinobu Inoue if (af6->ip6af_up != (struct ip6asfrag *)q6) { 59782cd038dSYoshinobu Inoue i = af6->ip6af_up->ip6af_off + af6->ip6af_up->ip6af_frglen 59882cd038dSYoshinobu Inoue - ip6af->ip6af_off; 59982cd038dSYoshinobu Inoue if (i > 0) { 6002bf76779SMunechika SUMIKAWA #if 0 /* suppress the noisy log */ 60182cd038dSYoshinobu Inoue log(LOG_ERR, "%d bytes of a fragment from %s " 60282cd038dSYoshinobu Inoue "overlaps the previous fragment\n", 6031d54aa3bSBjoern A. Zeeb i, ip6_sprintf(ip6buf, &q6->ip6q_src)); 6042bf76779SMunechika SUMIKAWA #endif 6052bf76779SMunechika SUMIKAWA free(ip6af, M_FTABLE); 60682cd038dSYoshinobu Inoue goto dropfrag; 60782cd038dSYoshinobu Inoue } 60882cd038dSYoshinobu Inoue } 60982cd038dSYoshinobu Inoue if (af6 != (struct ip6asfrag *)q6) { 61082cd038dSYoshinobu Inoue i = (ip6af->ip6af_off + ip6af->ip6af_frglen) - af6->ip6af_off; 61182cd038dSYoshinobu Inoue if (i > 0) { 6122bf76779SMunechika SUMIKAWA #if 0 /* suppress the noisy log */ 61382cd038dSYoshinobu Inoue log(LOG_ERR, "%d bytes of a fragment from %s " 61482cd038dSYoshinobu Inoue "overlaps the succeeding fragment", 6151d54aa3bSBjoern A. Zeeb i, ip6_sprintf(ip6buf, &q6->ip6q_src)); 6162bf76779SMunechika SUMIKAWA #endif 6172bf76779SMunechika SUMIKAWA free(ip6af, M_FTABLE); 61882cd038dSYoshinobu Inoue goto dropfrag; 61982cd038dSYoshinobu Inoue } 62082cd038dSYoshinobu Inoue } 621686cdd19SJun-ichiro itojun Hagino #endif 62282cd038dSYoshinobu Inoue 62382cd038dSYoshinobu Inoue insert: 6244b908c8bSRobert Watson #ifdef MAC 6254b908c8bSRobert Watson if (!first_frag) 6264b908c8bSRobert Watson mac_ip6q_update(m, q6); 6274b908c8bSRobert Watson #endif 62882cd038dSYoshinobu Inoue 62982cd038dSYoshinobu Inoue /* 63082cd038dSYoshinobu Inoue * Stick new segment in its place; 63182cd038dSYoshinobu Inoue * check for complete reassembly. 63203c99d76SJonathan T. Looney * If not complete, check fragment limit. 63382cd038dSYoshinobu Inoue * Move to front of packet queue, as we are 63482cd038dSYoshinobu Inoue * the most recently active fragmented packet. 63582cd038dSYoshinobu Inoue */ 63680d7a853SJonathan T. Looney frag6_enq(ip6af, af6->ip6af_up, hash); 6372adfd64fSJonathan T. Looney atomic_add_int(&frag6_nfrags, 1); 6389888c401SHajimu UMEMOTO q6->ip6q_nfrag++; 639686cdd19SJun-ichiro itojun Hagino #if 0 /* xxx */ 64080d7a853SJonathan T. Looney if (q6 != head->ip6q_next) { 64180d7a853SJonathan T. Looney frag6_remque(q6, hash); 64280d7a853SJonathan T. Looney frag6_insque_head(q6, head, hash); 643686cdd19SJun-ichiro itojun Hagino } 644686cdd19SJun-ichiro itojun Hagino #endif 64582cd038dSYoshinobu Inoue next = 0; 64682cd038dSYoshinobu Inoue for (af6 = q6->ip6q_down; af6 != (struct ip6asfrag *)q6; 64782cd038dSYoshinobu Inoue af6 = af6->ip6af_down) { 64882cd038dSYoshinobu Inoue if (af6->ip6af_off != next) { 64903c99d76SJonathan T. Looney if (q6->ip6q_nfrag > V_ip6_maxfragsperpacket) { 650198fdaedSTom Jones IP6STAT_ADD(ip6s_fragdropped, q6->ip6q_nfrag); 6516bbdbbb8SHans Petter Selasky frag6_freef(q6, hash); 65203c99d76SJonathan T. Looney } 65380d7a853SJonathan T. Looney IP6Q_UNLOCK(hash); 65482cd038dSYoshinobu Inoue return IPPROTO_DONE; 65582cd038dSYoshinobu Inoue } 65682cd038dSYoshinobu Inoue next += af6->ip6af_frglen; 65782cd038dSYoshinobu Inoue } 65882cd038dSYoshinobu Inoue if (af6->ip6af_up->ip6af_mff) { 65903c99d76SJonathan T. Looney if (q6->ip6q_nfrag > V_ip6_maxfragsperpacket) { 660198fdaedSTom Jones IP6STAT_ADD(ip6s_fragdropped, q6->ip6q_nfrag); 6616bbdbbb8SHans Petter Selasky frag6_freef(q6, hash); 66203c99d76SJonathan T. Looney } 66380d7a853SJonathan T. Looney IP6Q_UNLOCK(hash); 66482cd038dSYoshinobu Inoue return IPPROTO_DONE; 66582cd038dSYoshinobu Inoue } 66682cd038dSYoshinobu Inoue 66782cd038dSYoshinobu Inoue /* 66882cd038dSYoshinobu Inoue * Reassembly is complete; concatenate fragments. 66982cd038dSYoshinobu Inoue */ 67082cd038dSYoshinobu Inoue ip6af = q6->ip6q_down; 67182cd038dSYoshinobu Inoue t = m = IP6_REASS_MBUF(ip6af); 67282cd038dSYoshinobu Inoue af6 = ip6af->ip6af_down; 67380d7a853SJonathan T. Looney frag6_deq(ip6af, hash); 67482cd038dSYoshinobu Inoue while (af6 != (struct ip6asfrag *)q6) { 6759907aba3SAndrey V. Elsukov m->m_pkthdr.csum_flags &= 6769907aba3SAndrey V. Elsukov IP6_REASS_MBUF(af6)->m_pkthdr.csum_flags; 6779907aba3SAndrey V. Elsukov m->m_pkthdr.csum_data += 6789907aba3SAndrey V. Elsukov IP6_REASS_MBUF(af6)->m_pkthdr.csum_data; 6799907aba3SAndrey V. Elsukov 680686cdd19SJun-ichiro itojun Hagino af6dwn = af6->ip6af_down; 68180d7a853SJonathan T. Looney frag6_deq(af6, hash); 68282cd038dSYoshinobu Inoue while (t->m_next) 68382cd038dSYoshinobu Inoue t = t->m_next; 684ba99cc0bSAlexander V. Chernikov m_adj(IP6_REASS_MBUF(af6), af6->ip6af_offset); 68509b0b8c0SNavdeep Parhar m_demote_pkthdr(IP6_REASS_MBUF(af6)); 686ba99cc0bSAlexander V. Chernikov m_cat(t, IP6_REASS_MBUF(af6)); 687686cdd19SJun-ichiro itojun Hagino free(af6, M_FTABLE); 688686cdd19SJun-ichiro itojun Hagino af6 = af6dwn; 68982cd038dSYoshinobu Inoue } 69082cd038dSYoshinobu Inoue 6919907aba3SAndrey V. Elsukov while (m->m_pkthdr.csum_data & 0xffff0000) 6929907aba3SAndrey V. Elsukov m->m_pkthdr.csum_data = (m->m_pkthdr.csum_data & 0xffff) + 6939907aba3SAndrey V. Elsukov (m->m_pkthdr.csum_data >> 16); 6949907aba3SAndrey V. Elsukov 69582cd038dSYoshinobu Inoue /* adjust offset to point where the original next header starts */ 69682cd038dSYoshinobu Inoue offset = ip6af->ip6af_offset - sizeof(struct ip6_frag); 697686cdd19SJun-ichiro itojun Hagino free(ip6af, M_FTABLE); 698686cdd19SJun-ichiro itojun Hagino ip6 = mtod(m, struct ip6_hdr *); 69982cd038dSYoshinobu Inoue ip6->ip6_plen = htons((u_short)next + offset - sizeof(struct ip6_hdr)); 7005e9510e3SJINMEI Tatuya if (q6->ip6q_ecn == IPTOS_ECN_CE) 7015e9510e3SJINMEI Tatuya ip6->ip6_flow |= htonl(IPTOS_ECN_CE << 20); 70282cd038dSYoshinobu Inoue nxt = q6->ip6q_nxt; 703686cdd19SJun-ichiro itojun Hagino #ifdef notyet 704686cdd19SJun-ichiro itojun Hagino *q6->ip6q_nxtp = (u_char)(nxt & 0xff); 705686cdd19SJun-ichiro itojun Hagino #endif 70682cd038dSYoshinobu Inoue 7070b438b0fSGleb Smirnoff if (ip6_deletefraghdr(m, offset, M_NOWAIT) != 0) { 70880d7a853SJonathan T. Looney frag6_remque(q6, hash); 7092adfd64fSJonathan T. Looney atomic_subtract_int(&frag6_nfrags, q6->ip6q_nfrag); 7104b908c8bSRobert Watson #ifdef MAC 7114b908c8bSRobert Watson mac_ip6q_destroy(q6); 7124b908c8bSRobert Watson #endif 713686cdd19SJun-ichiro itojun Hagino free(q6, M_FTABLE); 71480d7a853SJonathan T. Looney atomic_subtract_int(&V_frag6_nfragpackets, 1); 7150b438b0fSGleb Smirnoff 716686cdd19SJun-ichiro itojun Hagino goto dropfrag; 71782cd038dSYoshinobu Inoue } 71882cd038dSYoshinobu Inoue 71982cd038dSYoshinobu Inoue /* 72082cd038dSYoshinobu Inoue * Store NXT to the original. 72182cd038dSYoshinobu Inoue */ 72268e0e5a6SAndrey V. Elsukov m_copyback(m, ip6_get_prevhdr(m, offset), sizeof(uint8_t), 72368e0e5a6SAndrey V. Elsukov (caddr_t)&nxt); 72482cd038dSYoshinobu Inoue 72580d7a853SJonathan T. Looney frag6_remque(q6, hash); 7262adfd64fSJonathan T. Looney atomic_subtract_int(&frag6_nfrags, q6->ip6q_nfrag); 7274b908c8bSRobert Watson #ifdef MAC 7284b908c8bSRobert Watson mac_ip6q_reassemble(q6, m); 7294b908c8bSRobert Watson mac_ip6q_destroy(q6); 7304b908c8bSRobert Watson #endif 73182cd038dSYoshinobu Inoue free(q6, M_FTABLE); 73280d7a853SJonathan T. Looney atomic_subtract_int(&V_frag6_nfragpackets, 1); 73382cd038dSYoshinobu Inoue 73482cd038dSYoshinobu Inoue if (m->m_flags & M_PKTHDR) { /* Isn't it always true? */ 73582cd038dSYoshinobu Inoue int plen = 0; 73682cd038dSYoshinobu Inoue for (t = m; t; t = t->m_next) 73782cd038dSYoshinobu Inoue plen += t->m_len; 73882cd038dSYoshinobu Inoue m->m_pkthdr.len = plen; 73982cd038dSYoshinobu Inoue } 74082cd038dSYoshinobu Inoue 741aaa46574SAdrian Chadd #ifdef RSS 742aaa46574SAdrian Chadd mtag = m_tag_alloc(MTAG_ABI_IPV6, IPV6_TAG_DIRECT, sizeof(*ip6dc), 743aaa46574SAdrian Chadd M_NOWAIT); 744aaa46574SAdrian Chadd if (mtag == NULL) 745aaa46574SAdrian Chadd goto dropfrag; 746aaa46574SAdrian Chadd 747aaa46574SAdrian Chadd ip6dc = (struct ip6_direct_ctx *)(mtag + 1); 748aaa46574SAdrian Chadd ip6dc->ip6dc_nxt = nxt; 749aaa46574SAdrian Chadd ip6dc->ip6dc_off = offset; 750aaa46574SAdrian Chadd 751aaa46574SAdrian Chadd m_tag_prepend(m, mtag); 752aaa46574SAdrian Chadd #endif 753aaa46574SAdrian Chadd 75480d7a853SJonathan T. Looney IP6Q_UNLOCK(hash); 7559cb8d207SAndrey V. Elsukov IP6STAT_INC(ip6s_reassembled); 75682cd038dSYoshinobu Inoue in6_ifstat_inc(dstifp, ifs6_reass_ok); 75782cd038dSYoshinobu Inoue 758aaa46574SAdrian Chadd #ifdef RSS 759aaa46574SAdrian Chadd /* 760aaa46574SAdrian Chadd * Queue/dispatch for reprocessing. 761aaa46574SAdrian Chadd */ 762aaa46574SAdrian Chadd netisr_dispatch(NETISR_IPV6_DIRECT, m); 763aaa46574SAdrian Chadd return IPPROTO_DONE; 764aaa46574SAdrian Chadd #endif 765aaa46574SAdrian Chadd 76682cd038dSYoshinobu Inoue /* 76782cd038dSYoshinobu Inoue * Tell launch routine the next header 76882cd038dSYoshinobu Inoue */ 76982cd038dSYoshinobu Inoue 77082cd038dSYoshinobu Inoue *mp = m; 77182cd038dSYoshinobu Inoue *offp = offset; 77282cd038dSYoshinobu Inoue 77382cd038dSYoshinobu Inoue return nxt; 77482cd038dSYoshinobu Inoue 77582cd038dSYoshinobu Inoue dropfrag: 77680d7a853SJonathan T. Looney IP6Q_UNLOCK(hash); 77782cd038dSYoshinobu Inoue in6_ifstat_inc(dstifp, ifs6_reass_fail); 7789cb8d207SAndrey V. Elsukov IP6STAT_INC(ip6s_fragdropped); 77982cd038dSYoshinobu Inoue m_freem(m); 78082cd038dSYoshinobu Inoue return IPPROTO_DONE; 78182cd038dSYoshinobu Inoue } 78282cd038dSYoshinobu Inoue 78382cd038dSYoshinobu Inoue /* 78482cd038dSYoshinobu Inoue * Free a fragment reassembly header and all 78582cd038dSYoshinobu Inoue * associated datagrams. 78682cd038dSYoshinobu Inoue */ 78780d7a853SJonathan T. Looney static void 7886bbdbbb8SHans Petter Selasky frag6_freef(struct ip6q *q6, uint32_t bucket) 78982cd038dSYoshinobu Inoue { 79082cd038dSYoshinobu Inoue struct ip6asfrag *af6, *down6; 79182cd038dSYoshinobu Inoue 79280d7a853SJonathan T. Looney IP6Q_LOCK_ASSERT(bucket); 7939888c401SHajimu UMEMOTO 79482cd038dSYoshinobu Inoue for (af6 = q6->ip6q_down; af6 != (struct ip6asfrag *)q6; 79582cd038dSYoshinobu Inoue af6 = down6) { 79682cd038dSYoshinobu Inoue struct mbuf *m = IP6_REASS_MBUF(af6); 79782cd038dSYoshinobu Inoue 79882cd038dSYoshinobu Inoue down6 = af6->ip6af_down; 79980d7a853SJonathan T. Looney frag6_deq(af6, bucket); 80082cd038dSYoshinobu Inoue 80182cd038dSYoshinobu Inoue /* 80282cd038dSYoshinobu Inoue * Return ICMP time exceeded error for the 1st fragment. 80382cd038dSYoshinobu Inoue * Just free other fragments. 80482cd038dSYoshinobu Inoue */ 8056bbdbbb8SHans Petter Selasky if (af6->ip6af_off == 0) { 80682cd038dSYoshinobu Inoue struct ip6_hdr *ip6; 80782cd038dSYoshinobu Inoue 80882cd038dSYoshinobu Inoue /* adjust pointer */ 80982cd038dSYoshinobu Inoue ip6 = mtod(m, struct ip6_hdr *); 81082cd038dSYoshinobu Inoue 81106cd0a3fSHajimu UMEMOTO /* restore source and destination addresses */ 81282cd038dSYoshinobu Inoue ip6->ip6_src = q6->ip6q_src; 81382cd038dSYoshinobu Inoue ip6->ip6_dst = q6->ip6q_dst; 81482cd038dSYoshinobu Inoue 81582cd038dSYoshinobu Inoue icmp6_error(m, ICMP6_TIME_EXCEEDED, 81682cd038dSYoshinobu Inoue ICMP6_TIME_EXCEED_REASSEMBLY, 0); 817686cdd19SJun-ichiro itojun Hagino } else 81882cd038dSYoshinobu Inoue m_freem(m); 819686cdd19SJun-ichiro itojun Hagino free(af6, M_FTABLE); 82082cd038dSYoshinobu Inoue } 82180d7a853SJonathan T. Looney frag6_remque(q6, bucket); 8222adfd64fSJonathan T. Looney atomic_subtract_int(&frag6_nfrags, q6->ip6q_nfrag); 8234b908c8bSRobert Watson #ifdef MAC 8244b908c8bSRobert Watson mac_ip6q_destroy(q6); 8254b908c8bSRobert Watson #endif 82682cd038dSYoshinobu Inoue free(q6, M_FTABLE); 82780d7a853SJonathan T. Looney atomic_subtract_int(&V_frag6_nfragpackets, 1); 82882cd038dSYoshinobu Inoue } 82982cd038dSYoshinobu Inoue 83082cd038dSYoshinobu Inoue /* 83182cd038dSYoshinobu Inoue * Put an ip fragment on a reassembly chain. 83282cd038dSYoshinobu Inoue * Like insque, but pointers in middle of structure. 83382cd038dSYoshinobu Inoue */ 83480d7a853SJonathan T. Looney static void 83580d7a853SJonathan T. Looney frag6_enq(struct ip6asfrag *af6, struct ip6asfrag *up6, 83680d7a853SJonathan T. Looney uint32_t bucket __unused) 83782cd038dSYoshinobu Inoue { 8389888c401SHajimu UMEMOTO 83980d7a853SJonathan T. Looney IP6Q_LOCK_ASSERT(bucket); 8409888c401SHajimu UMEMOTO 84182cd038dSYoshinobu Inoue af6->ip6af_up = up6; 84282cd038dSYoshinobu Inoue af6->ip6af_down = up6->ip6af_down; 84382cd038dSYoshinobu Inoue up6->ip6af_down->ip6af_up = af6; 84482cd038dSYoshinobu Inoue up6->ip6af_down = af6; 84582cd038dSYoshinobu Inoue } 84682cd038dSYoshinobu Inoue 84782cd038dSYoshinobu Inoue /* 84882cd038dSYoshinobu Inoue * To frag6_enq as remque is to insque. 84982cd038dSYoshinobu Inoue */ 85080d7a853SJonathan T. Looney static void 85180d7a853SJonathan T. Looney frag6_deq(struct ip6asfrag *af6, uint32_t bucket __unused) 85282cd038dSYoshinobu Inoue { 8539888c401SHajimu UMEMOTO 85480d7a853SJonathan T. Looney IP6Q_LOCK_ASSERT(bucket); 8559888c401SHajimu UMEMOTO 85682cd038dSYoshinobu Inoue af6->ip6af_up->ip6af_down = af6->ip6af_down; 85782cd038dSYoshinobu Inoue af6->ip6af_down->ip6af_up = af6->ip6af_up; 85882cd038dSYoshinobu Inoue } 85982cd038dSYoshinobu Inoue 86080d7a853SJonathan T. Looney static void 8611e9f3b73SJonathan T. Looney frag6_insque_head(struct ip6q *new, struct ip6q *old, uint32_t bucket) 86282cd038dSYoshinobu Inoue { 8639888c401SHajimu UMEMOTO 86480d7a853SJonathan T. Looney IP6Q_LOCK_ASSERT(bucket); 86580d7a853SJonathan T. Looney KASSERT(IP6Q_HEAD(bucket) == old, 86680d7a853SJonathan T. Looney ("%s: attempt to insert at head of wrong bucket" 86780d7a853SJonathan T. Looney " (bucket=%u, old=%p)", __func__, bucket, old)); 8689888c401SHajimu UMEMOTO 86982cd038dSYoshinobu Inoue new->ip6q_prev = old; 87082cd038dSYoshinobu Inoue new->ip6q_next = old->ip6q_next; 87182cd038dSYoshinobu Inoue old->ip6q_next->ip6q_prev= new; 87282cd038dSYoshinobu Inoue old->ip6q_next = new; 8731e9f3b73SJonathan T. Looney V_ip6q[bucket].count++; 87482cd038dSYoshinobu Inoue } 87582cd038dSYoshinobu Inoue 87680d7a853SJonathan T. Looney static void 8771e9f3b73SJonathan T. Looney frag6_remque(struct ip6q *p6, uint32_t bucket) 87882cd038dSYoshinobu Inoue { 8799888c401SHajimu UMEMOTO 88080d7a853SJonathan T. Looney IP6Q_LOCK_ASSERT(bucket); 8819888c401SHajimu UMEMOTO 88282cd038dSYoshinobu Inoue p6->ip6q_prev->ip6q_next = p6->ip6q_next; 88382cd038dSYoshinobu Inoue p6->ip6q_next->ip6q_prev = p6->ip6q_prev; 8841e9f3b73SJonathan T. Looney V_ip6q[bucket].count--; 88582cd038dSYoshinobu Inoue } 88682cd038dSYoshinobu Inoue 88782cd038dSYoshinobu Inoue /* 88833841545SHajimu UMEMOTO * IPv6 reassembling timer processing; 88982cd038dSYoshinobu Inoue * if a timer expires on a reassembly 89082cd038dSYoshinobu Inoue * queue, discard it. 89182cd038dSYoshinobu Inoue */ 89282cd038dSYoshinobu Inoue void 8931272577eSXin LI frag6_slowtimo(void) 89482cd038dSYoshinobu Inoue { 8958b615593SMarko Zec VNET_ITERATOR_DECL(vnet_iter); 89680d7a853SJonathan T. Looney struct ip6q *head, *q6; 89780d7a853SJonathan T. Looney int i; 89882cd038dSYoshinobu Inoue 8995ee847d3SRobert Watson VNET_LIST_RLOCK_NOSLEEP(); 9008b615593SMarko Zec VNET_FOREACH(vnet_iter) { 9018b615593SMarko Zec CURVNET_SET(vnet_iter); 90280d7a853SJonathan T. Looney for (i = 0; i < IP6REASS_NHASH; i++) { 90380d7a853SJonathan T. Looney IP6Q_LOCK(i); 90480d7a853SJonathan T. Looney head = IP6Q_HEAD(i); 90580d7a853SJonathan T. Looney q6 = head->ip6q_next; 9061e9f3b73SJonathan T. Looney if (q6 == NULL) { 9071e9f3b73SJonathan T. Looney /* 9081e9f3b73SJonathan T. Looney * XXXJTL: This should never happen. This 9091e9f3b73SJonathan T. Looney * should turn into an assertion. 9101e9f3b73SJonathan T. Looney */ 9111e9f3b73SJonathan T. Looney IP6Q_UNLOCK(i); 9121e9f3b73SJonathan T. Looney continue; 9131e9f3b73SJonathan T. Looney } 91480d7a853SJonathan T. Looney while (q6 != head) { 91582cd038dSYoshinobu Inoue --q6->ip6q_ttl; 91682cd038dSYoshinobu Inoue q6 = q6->ip6q_next; 91782cd038dSYoshinobu Inoue if (q6->ip6q_prev->ip6q_ttl == 0) { 918198fdaedSTom Jones IP6STAT_ADD(ip6s_fragtimeout, 919198fdaedSTom Jones q6->ip6q_prev->ip6q_nfrag); 92082cd038dSYoshinobu Inoue /* XXX in6_ifstat_inc(ifp, ifs6_reass_fail) */ 9216bbdbbb8SHans Petter Selasky frag6_freef(q6->ip6q_prev, i); 92282cd038dSYoshinobu Inoue } 92382cd038dSYoshinobu Inoue } 92482cd038dSYoshinobu Inoue /* 92582cd038dSYoshinobu Inoue * If we are over the maximum number of fragments 92682cd038dSYoshinobu Inoue * (due to the limit being lowered), drain off 92782cd038dSYoshinobu Inoue * enough to get down to the new limit. 9281e9f3b73SJonathan T. Looney * Note that we drain all reassembly queues if 9291e9f3b73SJonathan T. Looney * maxfragpackets is 0 (fragmentation is disabled), 9301e9f3b73SJonathan T. Looney * and don't enforce a limit when maxfragpackets 9311e9f3b73SJonathan T. Looney * is negative. 93282cd038dSYoshinobu Inoue */ 9331e9f3b73SJonathan T. Looney while ((V_ip6_maxfragpackets == 0 || 9341e9f3b73SJonathan T. Looney (V_ip6_maxfragpackets > 0 && 9351e9f3b73SJonathan T. Looney V_ip6q[i].count > V_ip6_maxfragbucketsize)) && 93680d7a853SJonathan T. Looney head->ip6q_prev != head) { 937198fdaedSTom Jones IP6STAT_ADD(ip6s_fragoverflow, 938198fdaedSTom Jones q6->ip6q_prev->ip6q_nfrag); 93982cd038dSYoshinobu Inoue /* XXX in6_ifstat_inc(ifp, ifs6_reass_fail) */ 9406bbdbbb8SHans Petter Selasky frag6_freef(head->ip6q_prev, i); 94180d7a853SJonathan T. Looney } 94280d7a853SJonathan T. Looney IP6Q_UNLOCK(i); 94382cd038dSYoshinobu Inoue } 9441e9f3b73SJonathan T. Looney /* 9451e9f3b73SJonathan T. Looney * If we are still over the maximum number of fragmented 9461e9f3b73SJonathan T. Looney * packets, drain off enough to get down to the new limit. 9471e9f3b73SJonathan T. Looney */ 9481e9f3b73SJonathan T. Looney i = 0; 9491e9f3b73SJonathan T. Looney while (V_ip6_maxfragpackets >= 0 && 9501e9f3b73SJonathan T. Looney atomic_load_int(&V_frag6_nfragpackets) > 9511e9f3b73SJonathan T. Looney (u_int)V_ip6_maxfragpackets) { 9521e9f3b73SJonathan T. Looney IP6Q_LOCK(i); 9531e9f3b73SJonathan T. Looney head = IP6Q_HEAD(i); 9541e9f3b73SJonathan T. Looney if (head->ip6q_prev != head) { 955198fdaedSTom Jones IP6STAT_ADD(ip6s_fragoverflow, 956198fdaedSTom Jones q6->ip6q_prev->ip6q_nfrag); 9571e9f3b73SJonathan T. Looney /* XXX in6_ifstat_inc(ifp, ifs6_reass_fail) */ 9586bbdbbb8SHans Petter Selasky frag6_freef(head->ip6q_prev, i); 9591e9f3b73SJonathan T. Looney } 9601e9f3b73SJonathan T. Looney IP6Q_UNLOCK(i); 9611e9f3b73SJonathan T. Looney i = (i + 1) % IP6REASS_NHASH; 9621e9f3b73SJonathan T. Looney } 9638b615593SMarko Zec CURVNET_RESTORE(); 9648b615593SMarko Zec } 9655ee847d3SRobert Watson VNET_LIST_RUNLOCK_NOSLEEP(); 96682cd038dSYoshinobu Inoue } 96782cd038dSYoshinobu Inoue 96882cd038dSYoshinobu Inoue /* 96982cd038dSYoshinobu Inoue * Drain off all datagram fragments. 97082cd038dSYoshinobu Inoue */ 97182cd038dSYoshinobu Inoue void 9721272577eSXin LI frag6_drain(void) 97382cd038dSYoshinobu Inoue { 9748b615593SMarko Zec VNET_ITERATOR_DECL(vnet_iter); 97580d7a853SJonathan T. Looney struct ip6q *head; 97680d7a853SJonathan T. Looney int i; 9779888c401SHajimu UMEMOTO 9785ee847d3SRobert Watson VNET_LIST_RLOCK_NOSLEEP(); 9798b615593SMarko Zec VNET_FOREACH(vnet_iter) { 9808b615593SMarko Zec CURVNET_SET(vnet_iter); 98180d7a853SJonathan T. Looney for (i = 0; i < IP6REASS_NHASH; i++) { 98280d7a853SJonathan T. Looney if (IP6Q_TRYLOCK(i) == 0) 98380d7a853SJonathan T. Looney continue; 98480d7a853SJonathan T. Looney head = IP6Q_HEAD(i); 98580d7a853SJonathan T. Looney while (head->ip6q_next != head) { 9869cb8d207SAndrey V. Elsukov IP6STAT_INC(ip6s_fragdropped); 98782cd038dSYoshinobu Inoue /* XXX in6_ifstat_inc(ifp, ifs6_reass_fail) */ 9886bbdbbb8SHans Petter Selasky frag6_freef(head->ip6q_next, i); 98980d7a853SJonathan T. Looney } 99080d7a853SJonathan T. Looney IP6Q_UNLOCK(i); 99182cd038dSYoshinobu Inoue } 9928b615593SMarko Zec CURVNET_RESTORE(); 9938b615593SMarko Zec } 9945ee847d3SRobert Watson VNET_LIST_RUNLOCK_NOSLEEP(); 99582cd038dSYoshinobu Inoue } 996e5ee7060SGleb Smirnoff 997e5ee7060SGleb Smirnoff int 998e5ee7060SGleb Smirnoff ip6_deletefraghdr(struct mbuf *m, int offset, int wait) 999e5ee7060SGleb Smirnoff { 1000e5ee7060SGleb Smirnoff struct ip6_hdr *ip6 = mtod(m, struct ip6_hdr *); 1001e5ee7060SGleb Smirnoff struct mbuf *t; 1002e5ee7060SGleb Smirnoff 1003e5ee7060SGleb Smirnoff /* Delete frag6 header. */ 1004e5ee7060SGleb Smirnoff if (m->m_len >= offset + sizeof(struct ip6_frag)) { 1005e5ee7060SGleb Smirnoff /* This is the only possible case with !PULLDOWN_TEST. */ 1006e5ee7060SGleb Smirnoff bcopy(ip6, (char *)ip6 + sizeof(struct ip6_frag), 1007e5ee7060SGleb Smirnoff offset); 1008e5ee7060SGleb Smirnoff m->m_data += sizeof(struct ip6_frag); 1009e5ee7060SGleb Smirnoff m->m_len -= sizeof(struct ip6_frag); 1010e5ee7060SGleb Smirnoff } else { 1011e5ee7060SGleb Smirnoff /* This comes with no copy if the boundary is on cluster. */ 1012e5ee7060SGleb Smirnoff if ((t = m_split(m, offset, wait)) == NULL) 1013e5ee7060SGleb Smirnoff return (ENOMEM); 1014e5ee7060SGleb Smirnoff m_adj(t, sizeof(struct ip6_frag)); 1015e5ee7060SGleb Smirnoff m_cat(m, t); 1016e5ee7060SGleb Smirnoff } 1017e5ee7060SGleb Smirnoff 1018a4061289SAndrey V. Elsukov m->m_flags |= M_FRAGMENTED; 1019e5ee7060SGleb Smirnoff return (0); 1020e5ee7060SGleb Smirnoff } 1021