1 /*
2 * CDDL HEADER START
3 *
4 * The contents of this file are subject to the terms of the
5 * Common Development and Distribution License, Version 1.0 only
6 * (the "License"). You may not use this file except in compliance
7 * with the License.
8 *
9 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
10 * or http://www.opensolaris.org/os/licensing.
11 * See the License for the specific language governing permissions
12 * and limitations under the License.
13 *
14 * When distributing Covered Code, include this CDDL HEADER in each
15 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
16 * If applicable, add the following below this CDDL HEADER, with the
17 * fields enclosed by brackets "[]" replaced with your own identifying
18 * information: Portions Copyright [yyyy] [name of copyright owner]
19 *
20 * CDDL HEADER END
21 */
22 /*
23 * Copyright 2005 Sun Microsystems, Inc. All rights reserved.
24 * Use is subject to license terms.
25 */
26
27 #ident "%Z%%M% %I% %E% SMI"
28
29 #include <sys/asm_linkage.h>
30
31 #if defined(lint)
32 #include <sys/types.h>
33 #endif /* lint */
34
35 /*
36 * ip_ocsum(address, halfword_count, sum)
37 * Do a 16 bit one's complement sum of a given number of (16-bit)
38 * halfwords. The halfword pointer must not be odd.
39 * %o0 address; %o1 count; %o2 sum accumulator; %o4 temp
40 * %g2 and %g3 used in main loop
41 *
42 * (from @(#)ocsum.s 1.3 89/02/24 SMI)
43 *
44 */
45
46 #if defined(lint)
47
48 /* ARGSUSED */
49 unsigned int
50 ip_ocsum(u_short *address, int halfword_count, unsigned int sum)
51 { return (0); }
52
53 #else /* lint */
54
55 ENTRY(ip_ocsum)
56 cmp %o1, 31 ! less than 62 bytes?
57 bl,a .dohw ! just do halfwords
58 tst %o1 ! delay slot, test count
59
60 btst 31, %o0 ! (delay slot)
61 bz 2f ! if 32 byte aligned, skip
62 nop
63
64 !
65 ! Do first halfwords until 32-byte aligned
66 !
67 1:
68 lduh [%o0], %g2 ! read data
69 add %o0, 2, %o0 ! increment address
70 add %o2, %g2, %o2 ! add to accumulator, don't need carry yet
71 btst 31, %o0 ! 32 byte aligned?
72 bnz 1b
73 sub %o1, 1, %o1 ! decrement count
74 !
75 ! loop to add in 32 byte chunks
76 ! The loads and adds are staggered to help avoid load/use
77 ! interlocks on highly pipelined implementations, and double
78 ! loads are used for 64-bit wide memory systems.
79 !
80 2:
81 sub %o1, 16, %o1 ! decrement count to aid testing
82 4:
83 ldd [%o0], %g2 ! read data
84 ldd [%o0+8], %o4 ! read more data
85 addcc %o2, %g2, %o2 ! add to accumulator
86 addxcc %o2, %g3, %o2 ! add to accumulator with carry
87 ldd [%o0+16], %g2 ! read more data
88 addxcc %o2, %o4, %o2 ! add to accumulator with carry
89 addxcc %o2, %o5, %o2 ! add to accumulator with carry
90 ldd [%o0+24], %o4 ! read more data
91 addxcc %o2, %g2, %o2 ! add to accumulator with carry
92 addxcc %o2, %g3, %o2 ! add to accumulator with carry
93 addxcc %o2, %o4, %o2 ! add to accumulator
94 addxcc %o2, %o5, %o2 ! add to accumulator with carry
95 addxcc %o2, 0, %o2 ! if final carry, add it in
96 subcc %o1, 16, %o1 ! decrement count (in halfwords)
97 bge 4b
98 add %o0, 32, %o0 ! delay slot, increment address
99
100 add %o1, 16, %o1 ! add back in
101 !
102 ! Do any remaining halfwords
103 !
104 b .dohw
105 tst %o1 ! delay slot, for more to do
106
107 3:
108 add %o0, 2, %o0 ! increment address
109 addcc %o2, %g2, %o2 ! add to accumulator
110 addxcc %o2, 0, %o2 ! if carry, add it in
111 subcc %o1, 1, %o1 ! decrement count
112 .dohw:
113 bg,a 3b ! more to do?
114 lduh [%o0], %g2 ! read data
115
116 !
117 ! at this point the 32-bit accumulator
118 ! has the result that needs to be returned in 16-bits
119 !
120 sll %o2, 16, %o4 ! put low halfword in high halfword %o4
121 addcc %o4, %o2, %o2 ! add the 2 halfwords in high %o2, set carry
122 srl %o2, 16, %o2 ! shift to low halfword
123 retl ! return
124 addxcc %o2, 0, %o0 ! add in carry if any. result in %o0
125 SET_SIZE(ip_ocsum)
126
127 #endif /* lint */