| 1 | /* |
| 2 | * Copyright (c) 2020-2021 Apple Inc. All rights reserved. |
| 3 | * |
| 4 | * @APPLE_OSREFERENCE_LICENSE_HEADER_START@ |
| 5 | * |
| 6 | * This file contains Original Code and/or Modifications of Original Code |
| 7 | * as defined in and that are subject to the Apple Public Source License |
| 8 | * Version 2.0 (the 'License'). You may not use this file except in |
| 9 | * compliance with the License. The rights granted to you under the License |
| 10 | * may not be used to create, or enable the creation or redistribution of, |
| 11 | * unlawful or unlicensed copies of an Apple operating system, or to |
| 12 | * circumvent, violate, or enable the circumvention or violation of, any |
| 13 | * terms of an Apple operating system software license agreement. |
| 14 | * |
| 15 | * Please obtain a copy of the License at |
| 16 | * http://www.opensource.apple.com/apsl/ and read it before using this file. |
| 17 | * |
| 18 | * The Original Code and all software distributed under the License are |
| 19 | * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER |
| 20 | * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES, |
| 21 | * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY, |
| 22 | * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT. |
| 23 | * Please see the License for the specific language governing rights and |
| 24 | * limitations under the License. |
| 25 | * |
| 26 | * @APPLE_OSREFERENCE_LICENSE_HEADER_END@ |
| 27 | */ |
| 28 | |
| 29 | /* |
| 30 | * extern int os_memcmp_mask_{16,32,48,64,80}B(const uint8_t *src1, |
| 31 | * const uint8_t *src2, const uint8_t *mask); |
| 32 | * |
| 33 | * This module implements fixed-length memory compare with mask routines, |
| 34 | * used mainly by the Skywalk networking subsystem. Each routine is called |
| 35 | * on every packet and therefore needs to be as efficient as possible. |
| 36 | * |
| 37 | * ARM64 kernel mode -- just like user mode -- no longer requires saving |
| 38 | * the vector registers, since it's done by the exception handler code. |
| 39 | */ |
| 40 | |
/*
 * Build guard: when KERNEL is not defined, this file may only be
 * assembled with LIBSYSCALL_INTERFACE defined.
 */
#if !defined(KERNEL) && !defined(LIBSYSCALL_INTERFACE)
#error "LIBSYSCALL_INTERFACE not defined"
#endif /* !KERNEL && !LIBSYSCALL_INTERFACE */

/*
 * Symbolic names for the three argument registers, in the order given
 * by the os_memcmp_mask_*B() prototype.
 */
#define src1	x0	/* 1st arg: first input buffer */
#define src2	x1	/* 2nd arg: second input buffer */
#define mask	x2	/* 3rd arg: byte mask */
| 50 | |
/*
 * os_memcmp_mask_16B
 *
 * @abstract Masked equality test over two 16-byte buffers.
 *
 * @discussion
 * Computes (src1 ^ src2) & mask over 16 bytes and returns the largest
 * resulting byte.  The result is therefore zero when the buffers agree
 * in every bit selected by the mask, and non-zero (1..255) otherwise.
 *
 * @param src1	first 16-byte input buffer
 * @param src2	second 16-byte input buffer
 * @param mask	16-byte mask applied to the difference before comparison
 */
	.text
	.align	4
	.globl	_os_memcmp_mask_16B
_os_memcmp_mask_16B:
	/* Fetch both inputs and the mask. */
	ld1	{v0.16b}, [src1]
	ld1	{v1.16b}, [src2]
	ld1	{v2.16b}, [mask]

	/* v0 = bits that differ and are selected by the mask. */
	eor	v0.16b, v0.16b, v1.16b
	and	v0.16b, v0.16b, v2.16b

	/*
	 * Reduce to the maximum byte.  The scalar write to b0 clears the
	 * remaining bits of v0, so lane s[0] holds that byte zero-extended.
	 */
	umaxv	b0, v0.16b
	mov	w0, v0.s[0]
	ret
| 77 | |
/*
 * os_memcmp_mask_32B
 *
 * @abstract Masked equality test over two 32-byte buffers.
 *
 * @discussion
 * Computes (src1 ^ src2) & mask over 32 bytes, ORs the two 16-byte
 * halves together and returns the largest resulting byte.  The result
 * is zero when the buffers agree in every bit selected by the mask,
 * and non-zero otherwise.
 *
 * @param src1	first 32-byte input buffer
 * @param src2	second 32-byte input buffer
 * @param mask	32-byte mask applied to the difference before comparison
 */
	.text
	.align	4
	.globl	_os_memcmp_mask_32B
_os_memcmp_mask_32B:
	/* v0-v1 = src1, v2-v3 = src2, v4-v5 = mask. */
	ld1	{v0.16b, v1.16b}, [src1]
	ld1	{v2.16b, v3.16b}, [src2]
	ld1	{v4.16b, v5.16b}, [mask]

	/* Per-chunk difference. */
	eor	v0.16b, v0.16b, v2.16b
	eor	v1.16b, v1.16b, v3.16b

	/* Keep only the bits selected by the mask. */
	and	v0.16b, v0.16b, v4.16b
	and	v1.16b, v1.16b, v5.16b

	/* Fold both chunks into v0. */
	orr	v0.16b, v0.16b, v1.16b

	/*
	 * Reduce to the maximum byte.  The scalar write to b0 clears the
	 * remaining bits of v0, so lane s[0] holds that byte zero-extended.
	 */
	umaxv	b0, v0.16b
	mov	w0, v0.s[0]
	ret
| 107 | |
/*
 * os_memcmp_mask_48B
 *
 * @abstract Masked equality test over two 48-byte buffers.
 *
 * @discussion
 * Computes (src1 ^ src2) & mask over 48 bytes, ORs the three 16-byte
 * chunks together and returns the largest resulting byte.  The result
 * is zero when the buffers agree in every bit selected by the mask,
 * and non-zero otherwise.
 *
 * @param src1	first 48-byte input buffer
 * @param src2	second 48-byte input buffer
 * @param mask	48-byte mask applied to the difference before comparison
 */
	.text
	.align	4
	.globl	_os_memcmp_mask_48B
_os_memcmp_mask_48B:
	/* v0-v2 = src1, v3-v5 = src2, v16-v18 = mask. */
	ld1	{v0.16b, v1.16b, v2.16b}, [src1]
	ld1	{v3.16b, v4.16b, v5.16b}, [src2]
	ld1	{v16.16b, v17.16b, v18.16b}, [mask]

	/* Per-chunk difference. */
	eor	v0.16b, v0.16b, v3.16b
	eor	v1.16b, v1.16b, v4.16b
	eor	v2.16b, v2.16b, v5.16b

	/* Keep only the bits selected by the mask. */
	and	v0.16b, v0.16b, v16.16b
	and	v1.16b, v1.16b, v17.16b
	and	v2.16b, v2.16b, v18.16b

	/* Fold all three chunks into v0. */
	orr	v0.16b, v0.16b, v1.16b
	orr	v0.16b, v0.16b, v2.16b

	/*
	 * Reduce to the maximum byte.  The scalar write to b0 clears the
	 * remaining bits of v0, so lane s[0] holds that byte zero-extended.
	 */
	umaxv	b0, v0.16b
	mov	w0, v0.s[0]
	ret
| 140 | |
/*
 * os_memcmp_mask_64B
 *
 * @abstract Masked equality test over two 64-byte buffers.
 *
 * @discussion
 * Computes (src1 ^ src2) & mask over 64 bytes, ORs the four 16-byte
 * chunks together and returns the largest resulting byte.  The result
 * is zero when the buffers agree in every bit selected by the mask,
 * and non-zero otherwise.
 *
 * @param src1	first 64-byte input buffer
 * @param src2	second 64-byte input buffer
 * @param mask	64-byte mask applied to the difference before comparison
 */
	.text
	.align	4
	.globl	_os_memcmp_mask_64B
_os_memcmp_mask_64B:
	/* v0-v3 = src1, v4-v7 = src2, v16-v19 = mask. */
	ld1	{v0.16b, v1.16b, v2.16b, v3.16b}, [src1]
	ld1	{v4.16b, v5.16b, v6.16b, v7.16b}, [src2]
	ld1	{v16.16b, v17.16b, v18.16b, v19.16b}, [mask]

	/* Per-chunk difference. */
	eor	v0.16b, v0.16b, v4.16b
	eor	v1.16b, v1.16b, v5.16b
	eor	v2.16b, v2.16b, v6.16b
	eor	v3.16b, v3.16b, v7.16b

	/* Keep only the bits selected by the mask. */
	and	v0.16b, v0.16b, v16.16b
	and	v1.16b, v1.16b, v17.16b
	and	v2.16b, v2.16b, v18.16b
	and	v3.16b, v3.16b, v19.16b

	/* Pairwise fold of the four chunks into v0. */
	orr	v0.16b, v0.16b, v1.16b
	orr	v2.16b, v2.16b, v3.16b
	orr	v0.16b, v0.16b, v2.16b

	/*
	 * Reduce to the maximum byte.  The scalar write to b0 clears the
	 * remaining bits of v0, so lane s[0] holds that byte zero-extended.
	 */
	umaxv	b0, v0.16b
	mov	w0, v0.s[0]
	ret
| 176 | |
/*
 * os_memcmp_mask_80B
 *
 * @abstract Masked equality test over two 80-byte buffers.
 *
 * @discussion
 * Computes (src1 ^ src2) & mask over 80 bytes, ORs the five 16-byte
 * chunks together and returns the largest resulting byte.  The result
 * is zero when the buffers agree in every bit selected by the mask,
 * and non-zero otherwise.
 *
 * Each operand is read as a 64-byte load followed by a 16-byte load;
 * the post-indexed form advances the three argument registers by 64
 * along the way.
 *
 * @param src1	first 80-byte input buffer
 * @param src2	second 80-byte input buffer
 * @param mask	80-byte mask applied to the difference before comparison
 */
	.text
	.align	4
	.globl	_os_memcmp_mask_80B
_os_memcmp_mask_80B:
	/* v0-v4 = src1. */
	ld1	{v0.16b, v1.16b, v2.16b, v3.16b}, [src1], #64
	ld1	{v4.16b}, [src1]

	/* v16-v20 = src2. */
	ld1	{v16.16b, v17.16b, v18.16b, v19.16b}, [src2], #64
	ld1	{v20.16b}, [src2]

	/* v21-v25 = mask. */
	ld1	{v21.16b, v22.16b, v23.16b, v24.16b}, [mask], #64
	ld1	{v25.16b}, [mask]

	/* Per-chunk difference. */
	eor	v0.16b, v0.16b, v16.16b
	eor	v1.16b, v1.16b, v17.16b
	eor	v2.16b, v2.16b, v18.16b
	eor	v3.16b, v3.16b, v19.16b
	eor	v4.16b, v4.16b, v20.16b

	/* Keep only the bits selected by the mask. */
	and	v0.16b, v0.16b, v21.16b
	and	v1.16b, v1.16b, v22.16b
	and	v2.16b, v2.16b, v23.16b
	and	v3.16b, v3.16b, v24.16b
	and	v4.16b, v4.16b, v25.16b

	/* Fold the five chunks into v0. */
	orr	v0.16b, v0.16b, v1.16b
	orr	v2.16b, v2.16b, v3.16b
	orr	v0.16b, v0.16b, v2.16b
	orr	v0.16b, v0.16b, v4.16b

	/*
	 * Reduce to the maximum byte.  The scalar write to b0 clears the
	 * remaining bits of v0, so lane s[0] holds that byte zero-extended.
	 */
	umaxv	b0, v0.16b
	mov	w0, v0.s[0]
	ret
| 218 | |