/*- * Copyright (c) 2012 The NetBSD Foundation, Inc. * All rights reserved. * * This code is derived from software contributed to The NetBSD Foundation * by Matt Thomas of 3am Software Foundry. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * 1. Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * 2. Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution. * * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE * POSSIBILITY OF SUCH DAMAGE. */ #include __KERNEL_RCSID(0, "$NetBSD: cpu_in_cksum_neon.c,v 1.1 2012/12/17 00:44:03 matt Exp $"); #include #include #include #include #include uint32_t cpu_in_cksum_neon(const void *, size_t); uint32_t cpu_in_cksum_neon_v4hdr(const void *); int cpu_in_cksum(struct mbuf *m, int len, int off, uint32_t initial_sum) { uint32_t csum = initial_sum; int odd = 0; /* * Taken control of the NEON PCU. */ vfp_hijack(); /* * Fast path for the normal ip_header */ if (off == 0 && csum == 0 && len == sizeof(struct ip) && ((uintptr_t)m->m_data & 3) == 0 && m->m_len >= len) { csum = cpu_in_cksum_neon_v4hdr(m->m_data); /* * We are now down with NEON. */ vfp_surrender(); if (csum == 0x10000) /* note 0x10000 - 0xffff == 1 */ return 1; return csum == 0 ? 0xffff : csum; /* never return 0. */ } /* * Skip the initial mbufs */ while (m->m_len >= off) { m = m->m_next; off -= m->m_len; KASSERT(m != NULL); } for (; len > 0; m = m->m_next, off = 0) { KASSERT(m != NULL); int dlen = MIN(m->m_len - off, len); const void *dptr = m->m_data + off; /* * This routine will add based on the memory layout so * if the previous len was odd or the this buffer starts * on an odd address, shift the csum by 8 so its properly * aligned. It will be taken care of when we do the final * checksum fold. */ uint32_t tmpsum = cpu_in_cksum_neon(dptr, dlen); if (odd ^ ((uint32_t)dptr & 1)) tmpsum <<= 8; /* * Accumulate checksum, folding will be done later */ csum += tmpsum; odd ^= dlen & 1; len -= dlen; } /* * We are now down with NEON. */ vfp_surrender(); /* * Time to fold the checksum */ csum = (csum >> 16) + (csum & 0xffff); /* * Now it could be 0x1xxxx so fold again */ csum = (csum >> 16) + (csum & 0xffff); KASSERT(csum <= 0x10000); if (csum == 0x10000) /* note 0x10000 - 0xffff == 1 */ return 1; return csum == 0 ? 0xffff : csum; /* never return 0. */ }