1 /*
   2  * CDDL HEADER START
   3  *
   4  * The contents of this file are subject to the terms of the
   5  * Common Development and Distribution License, Version 1.0 only
   6  * (the "License").  You may not use this file except in compliance
   7  * with the License.
   8  *
   9  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
  10  * or http://www.opensolaris.org/os/licensing.
  11  * See the License for the specific language governing permissions
  12  * and limitations under the License.
  13  *
  14  * When distributing Covered Code, include this CDDL HEADER in each
  15  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
  16  * If applicable, add the following below this CDDL HEADER, with the
  17  * fields enclosed by brackets "[]" replaced with your own identifying
  18  * information: Portions Copyright [yyyy] [name of copyright owner]
  19  *
  20  * CDDL HEADER END
  21  */
  22 /*
  23  * Copyright 2005 Sun Microsystems, Inc.  All rights reserved.
  24  * Use is subject to license terms.
  25  */
  26 
  27 #ident  "%Z%%M% %I%     %E% SMI"
  28 
  29 #include <sys/asm_linkage.h>
  30 
  31 #if defined(lint)
  32 #include <sys/types.h>
  33 #endif  /* lint */
  34 
  35 /*
  36  * ip_ocsum(address, halfword_count, sum)
  37  * Do a 16 bit one's complement sum of a given number of (16-bit)
  38  * halfwords. The halfword pointer must not be odd.
  39  *      %o0 address; %o1 count; %o2 sum accumulator; %o4 temp
  40  *      %g2 and %g3 used in main loop
  41  *
  42  * (from @(#)ocsum.s 1.3 89/02/24 SMI)
  43  *
  44  */
  45 
  46 #if defined(lint) 
  47 
  48 /* ARGSUSED */
  49 unsigned int
  50 ip_ocsum(u_short *address, int halfword_count, unsigned int sum)
  51 { return (0); }
  52 
  53 #else   /* lint */
  54 
  55         ENTRY(ip_ocsum)
  56         cmp     %o1, 31         ! less than 62 bytes?
  57         bl,a    .dohw           !   just do halfwords
  58         tst     %o1             ! delay slot, test count
  59 
  60         btst    31, %o0         ! (delay slot)
  61         bz      2f              ! if 32 byte aligned, skip
  62         nop
  63 
  64         !
  65         ! Do first halfwords until 32-byte aligned
  66         !
  67 1:
  68         lduh    [%o0], %g2      ! read data
  69         add     %o0, 2, %o0     ! increment address
  70         add     %o2, %g2, %o2   ! add to accumulator, don't need carry yet
  71         btst    31, %o0         ! 32 byte aligned?
  72         bnz     1b
  73         sub     %o1, 1, %o1     ! decrement count
  74         !
  75         ! loop to add in 32 byte chunks
  76         ! The loads and adds are staggered to help avoid load/use
  77         ! interlocks on highly pipelined implementations, and double
  78         ! loads are used for 64-bit wide memory systems.
  79         !
  80 2:
  81         sub     %o1, 16, %o1    ! decrement count to aid testing
  82 4:
  83         ldd     [%o0], %g2      ! read data
  84         ldd     [%o0+8], %o4    ! read more data
  85         addcc   %o2, %g2, %o2   ! add to accumulator
  86         addxcc  %o2, %g3, %o2   ! add to accumulator with carry
  87         ldd     [%o0+16], %g2   ! read more data
  88         addxcc  %o2, %o4, %o2   ! add to accumulator with carry
  89         addxcc  %o2, %o5, %o2   ! add to accumulator with carry
  90         ldd     [%o0+24], %o4   ! read more data
  91         addxcc  %o2, %g2, %o2   ! add to accumulator with carry
  92         addxcc  %o2, %g3, %o2   ! add to accumulator with carry
  93         addxcc  %o2, %o4, %o2   ! add to accumulator
  94         addxcc  %o2, %o5, %o2   ! add to accumulator with carry
  95         addxcc  %o2, 0, %o2     ! if final carry, add it in
  96         subcc   %o1, 16, %o1    ! decrement count (in halfwords)
  97         bge     4b
  98         add     %o0, 32, %o0    ! delay slot, increment address
  99         
 100         add     %o1, 16, %o1    ! add back in
 101         !
 102         ! Do any remaining halfwords
 103         !
 104         b       .dohw
 105         tst     %o1             ! delay slot, for more to do
 106 
 107 3:
 108         add     %o0, 2, %o0     ! increment address
 109         addcc   %o2, %g2, %o2   ! add to accumulator
 110         addxcc  %o2, 0, %o2     ! if carry, add it in
 111         subcc   %o1, 1, %o1     ! decrement count
 112 .dohw:
 113         bg,a    3b              ! more to do?
 114         lduh    [%o0], %g2      ! read data
 115 
 116         !
 117         ! at this point the 32-bit accumulator
 118         ! has the result that needs to be returned in 16-bits
 119         !
 120         sll     %o2, 16, %o4    ! put low halfword in high halfword %o4
 121         addcc   %o4, %o2, %o2   ! add the 2 halfwords in high %o2, set carry
 122         srl     %o2, 16, %o2    ! shift to low halfword
 123         retl                    ! return
 124         addxcc  %o2, 0, %o0     ! add in carry if any. result in %o0
 125         SET_SIZE(ip_ocsum)
 126 
 127 #endif  /* lint */