3 // Copyright 2018 The Go Authors. All rights reserved.
4 // Use of this source code is governed by a BSD-style
5 // license that can be found in the LICENSE file.
11 // ----------------------- //
12 // bits.LeadingZeros //
13 // ----------------------- //
15 func LeadingZeros(n uint) int {
18 // arm:"CLZ" arm64:"CLZ"
21 return bits.LeadingZeros(n)
24 func LeadingZeros64(n uint64) int {
27 // arm:"CLZ" arm64:"CLZ"
30 return bits.LeadingZeros64(n)
33 func LeadingZeros32(n uint32) int {
34 // amd64:"BSRQ","LEAQ",-"CMOVQEQ"
36 // arm:"CLZ" arm64:"CLZW"
39 return bits.LeadingZeros32(n)
42 func LeadingZeros16(n uint16) int {
43 // amd64:"BSRL","LEAL",-"CMOVQEQ"
45 // arm:"CLZ" arm64:"CLZ"
48 return bits.LeadingZeros16(n)
51 func LeadingZeros8(n uint8) int {
52 // amd64:"BSRL","LEAL",-"CMOVQEQ"
54 // arm:"CLZ" arm64:"CLZ"
57 return bits.LeadingZeros8(n)
64 func Len(n uint) int {
67 // arm:"CLZ" arm64:"CLZ"
73 func Len64(n uint64) int {
76 // arm:"CLZ" arm64:"CLZ"
82 func Len32(n uint32) int {
83 // amd64:"BSRQ","LEAQ",-"CMOVQEQ"
85 // arm:"CLZ" arm64:"CLZ"
91 func Len16(n uint16) int {
92 // amd64:"BSRL","LEAL",-"CMOVQEQ"
94 // arm:"CLZ" arm64:"CLZ"
100 func Len8(n uint8) int {
101 // amd64:"BSRL","LEAL",-"CMOVQEQ"
103 // arm:"CLZ" arm64:"CLZ"
109 // -------------------- //
111 // -------------------- //
113 func OnesCount(n uint) int {
114 // amd64:"POPCNTQ",".*x86HasPOPCNT"
115 // arm64:"VCNT","VUADDLV"
120 return bits.OnesCount(n)
123 func OnesCount64(n uint64) int {
124 // amd64:"POPCNTQ",".*x86HasPOPCNT"
125 // arm64:"VCNT","VUADDLV"
130 return bits.OnesCount64(n)
133 func OnesCount32(n uint32) int {
134 // amd64:"POPCNTL",".*x86HasPOPCNT"
135 // arm64:"VCNT","VUADDLV"
140 return bits.OnesCount32(n)
143 func OnesCount16(n uint16) int {
144 // amd64:"POPCNTL",".*x86HasPOPCNT"
145 // arm64:"VCNT","VUADDLV"
150 return bits.OnesCount16(n)
153 func OnesCount8(n uint8) int {
158 return bits.OnesCount8(n)
161 // ----------------------- //
162 // bits.ReverseBytes //
163 // ----------------------- //
165 func ReverseBytes(n uint) uint {
169 return bits.ReverseBytes(n)
172 func ReverseBytes64(n uint64) uint64 {
176 return bits.ReverseBytes64(n)
179 func ReverseBytes32(n uint32) uint32 {
183 return bits.ReverseBytes32(n)
186 func ReverseBytes16(n uint16) uint16 {
188 // arm64:"REV16W",-"UBFX",-"ORR"
189 // arm/5:"SLL","SRL","ORR"
192 return bits.ReverseBytes16(n)
195 // --------------------- //
196 // bits.RotateLeft //
197 // --------------------- //
199 func RotateLeft64(n uint64) uint64 {
206 return bits.RotateLeft64(n, 37)
209 func RotateLeft32(n uint32) uint32 {
210 // amd64:"ROLL" 386:"ROLL"
211 // arm:`MOVW\tR[0-9]+@>23`
216 return bits.RotateLeft32(n, 9)
219 func RotateLeft16(n uint16) uint16 {
220 // amd64:"ROLW" 386:"ROLW"
221 return bits.RotateLeft16(n, 5)
224 func RotateLeft8(n uint8) uint8 {
225 // amd64:"ROLB" 386:"ROLB"
226 return bits.RotateLeft8(n, 5)
229 func RotateLeftVariable(n uint, m int) uint {
235 return bits.RotateLeft(n, m)
238 func RotateLeftVariable64(n uint64, m int) uint64 {
244 return bits.RotateLeft64(n, m)
247 func RotateLeftVariable32(n uint32, m int) uint32 {
248 // arm:`MOVW\tR[0-9]+@>R[0-9]+`
254 return bits.RotateLeft32(n, m)
257 // ------------------------ //
258 // bits.TrailingZeros //
259 // ------------------------ //
261 func TrailingZeros(n uint) int {
262 // amd64:"BSFQ","MOVL\t\\$64","CMOVQEQ"
264 // arm64:"RBIT","CLZ"
266 // ppc64/power8:"ANDN","POPCNTD"
267 // ppc64le/power8:"ANDN","POPCNTD"
268 // ppc64/power9: "CNTTZD"
269 // ppc64le/power9: "CNTTZD"
271 return bits.TrailingZeros(n)
274 func TrailingZeros64(n uint64) int {
275 // amd64:"BSFQ","MOVL\t\\$64","CMOVQEQ"
276 // arm64:"RBIT","CLZ"
278 // ppc64/power8:"ANDN","POPCNTD"
279 // ppc64le/power8:"ANDN","POPCNTD"
280 // ppc64/power9: "CNTTZD"
281 // ppc64le/power9: "CNTTZD"
283 return bits.TrailingZeros64(n)
286 func TrailingZeros32(n uint32) int {
287 // amd64:"BTSQ\\t\\$32","BSFQ"
289 // arm64:"RBITW","CLZW"
290 // s390x:"FLOGR","MOVWZ"
291 // ppc64/power8:"ANDN","POPCNTW"
292 // ppc64le/power8:"ANDN","POPCNTW"
293 // ppc64/power9: "CNTTZW"
294 // ppc64le/power9: "CNTTZW"
296 return bits.TrailingZeros32(n)
299 func TrailingZeros16(n uint16) int {
300 // amd64:"BSFL","BTSL\\t\\$16"
302 // arm:"ORR\t\\$65536","CLZ",-"MOVHU\tR"
303 // arm64:"ORR\t\\$65536","RBITW","CLZW",-"MOVHU\tR",-"RBIT\t",-"CLZ\t"
304 // s390x:"FLOGR","OR\t\\$65536"
305 // ppc64/power8:"POPCNTD","OR\\t\\$65536"
306 // ppc64le/power8:"POPCNTD","OR\\t\\$65536"
307 // ppc64/power9:"CNTTZD","OR\\t\\$65536"
308 // ppc64le/power9:"CNTTZD","OR\\t\\$65536"
310 return bits.TrailingZeros16(n)
313 func TrailingZeros8(n uint8) int {
314 // amd64:"BSFL","BTSL\\t\\$8"
315 // arm:"ORR\t\\$256","CLZ",-"MOVBU\tR"
316 // arm64:"ORR\t\\$256","RBITW","CLZW",-"MOVBU\tR",-"RBIT\t",-"CLZ\t"
317 // s390x:"FLOGR","OR\t\\$256"
319 return bits.TrailingZeros8(n)
322 // IterateBitsNN checks special handling of TrailingZerosNN when the input is known to be non-zero.
324 func IterateBits(n uint) int {
327 // amd64:"BSFQ",-"CMOVEQ"
328 i += bits.TrailingZeros(n)
334 func IterateBits64(n uint64) int {
337 // amd64:"BSFQ",-"CMOVEQ"
338 i += bits.TrailingZeros64(n)
344 func IterateBits32(n uint32) int {
347 // amd64:"BSFL",-"BTSQ"
348 i += bits.TrailingZeros32(n)
354 func IterateBits16(n uint16) int {
357 // amd64:"BSFL",-"BTSL"
358 // arm64:"RBITW","CLZW",-"ORR"
359 i += bits.TrailingZeros16(n)
365 func IterateBits8(n uint8) int {
368 // amd64:"BSFL",-"BTSL"
369 // arm64:"RBITW","CLZW",-"ORR"
370 i += bits.TrailingZeros8(n)
376 // --------------- //
378 // --------------- //
380 func Add(x, y, ci uint) (r, co uint) {
381 // arm64:"ADDS","ADCS","ADC",-"ADD\t",-"CMP"
382 // amd64:"NEGL","ADCQ","SBBQ","NEGQ"
383 // s390x:"ADDE","ADDC\t[$]-1,"
384 return bits.Add(x, y, ci)
387 func AddC(x, ci uint) (r, co uint) {
388 // arm64:"ADDS","ADCS","ADC",-"ADD\t",-"CMP"
389 // amd64:"NEGL","ADCQ","SBBQ","NEGQ"
390 // s390x:"ADDE","ADDC\t[$]-1,"
391 return bits.Add(x, 7, ci)
394 func AddZ(x, y uint) (r, co uint) {
395 // arm64:"ADDS","ADC",-"ADCS",-"ADD\t",-"CMP"
396 // amd64:"ADDQ","SBBQ","NEGQ",-"NEGL",-"ADCQ"
397 // s390x:"ADDC",-"ADDC\t[$]-1,"
398 return bits.Add(x, y, 0)
401 func AddR(x, y, ci uint) uint {
402 // arm64:"ADDS","ADCS",-"ADD\t",-"CMP"
403 // amd64:"NEGL","ADCQ",-"SBBQ",-"NEGQ"
404 // s390x:"ADDE","ADDC\t[$]-1,"
405 r, _ := bits.Add(x, y, ci)
409 func AddM(p, q, r *[3]uint) {
411 r[0], c = bits.Add(p[0], q[0], c)
412 // arm64:"ADCS",-"ADD\t",-"CMP"
413 // amd64:"ADCQ",-"NEGL",-"SBBQ",-"NEGQ"
414 // s390x:"ADDE",-"ADDC\t[$]-1,"
415 r[1], c = bits.Add(p[1], q[1], c)
416 r[2], c = bits.Add(p[2], q[2], c)
419 func Add64(x, y, ci uint64) (r, co uint64) {
420 // arm64:"ADDS","ADCS","ADC",-"ADD\t",-"CMP"
421 // amd64:"NEGL","ADCQ","SBBQ","NEGQ"
422 // ppc64: "ADDC", "ADDE", "ADDZE"
423 // ppc64le: "ADDC", "ADDE", "ADDZE"
424 // s390x:"ADDE","ADDC\t[$]-1,"
425 return bits.Add64(x, y, ci)
428 func Add64C(x, ci uint64) (r, co uint64) {
429 // arm64:"ADDS","ADCS","ADC",-"ADD\t",-"CMP"
430 // amd64:"NEGL","ADCQ","SBBQ","NEGQ"
431 // ppc64: "ADDC", "ADDE", "ADDZE"
432 // ppc64le: "ADDC", "ADDE", "ADDZE"
433 // s390x:"ADDE","ADDC\t[$]-1,"
434 return bits.Add64(x, 7, ci)
437 func Add64Z(x, y uint64) (r, co uint64) {
438 // arm64:"ADDS","ADC",-"ADCS",-"ADD\t",-"CMP"
439 // amd64:"ADDQ","SBBQ","NEGQ",-"NEGL",-"ADCQ"
440 // ppc64: "ADDC", "ADDE", "ADDZE"
441 // ppc64le: "ADDC", "ADDE", "ADDZE"
442 // s390x:"ADDC",-"ADDC\t[$]-1,"
443 return bits.Add64(x, y, 0)
446 func Add64R(x, y, ci uint64) uint64 {
447 // arm64:"ADDS","ADCS",-"ADD\t",-"CMP"
448 // amd64:"NEGL","ADCQ",-"SBBQ",-"NEGQ"
449 // ppc64: "ADDC", "ADDE", "ADDZE"
450 // ppc64le: "ADDC", "ADDE", "ADDZE"
451 // s390x:"ADDE","ADDC\t[$]-1,"
452 r, _ := bits.Add64(x, y, ci)
455 func Add64M(p, q, r *[3]uint64) {
457 r[0], c = bits.Add64(p[0], q[0], c)
458 // arm64:"ADCS",-"ADD\t",-"CMP"
459 // amd64:"ADCQ",-"NEGL",-"SBBQ",-"NEGQ"
460 // ppc64: "ADDC", "ADDE", "ADDZE"
461 // ppc64le: "ADDC", "ADDE", "ADDZE"
462 // s390x:"ADDE",-"ADDC\t[$]-1,"
463 r[1], c = bits.Add64(p[1], q[1], c)
464 r[2], c = bits.Add64(p[2], q[2], c)
467 // --------------- //
469 // --------------- //
471 func Sub(x, y, ci uint) (r, co uint) {
472 // amd64:"NEGL","SBBQ","NEGQ"
473 // arm64:"NEGS","SBCS","NGC","NEG",-"ADD",-"SUB",-"CMP"
475 return bits.Sub(x, y, ci)
478 func SubC(x, ci uint) (r, co uint) {
479 // amd64:"NEGL","SBBQ","NEGQ"
480 // arm64:"NEGS","SBCS","NGC","NEG",-"ADD",-"SUB",-"CMP"
482 return bits.Sub(x, 7, ci)
485 func SubZ(x, y uint) (r, co uint) {
486 // amd64:"SUBQ","SBBQ","NEGQ",-"NEGL"
487 // arm64:"SUBS","NGC","NEG",-"SBCS",-"ADD",-"SUB\t",-"CMP"
489 return bits.Sub(x, y, 0)
492 func SubR(x, y, ci uint) uint {
493 // amd64:"NEGL","SBBQ",-"NEGQ"
494 // arm64:"NEGS","SBCS",-"NGC",-"NEG\t",-"ADD",-"SUB",-"CMP"
496 r, _ := bits.Sub(x, y, ci)
499 func SubM(p, q, r *[3]uint) {
501 r[0], c = bits.Sub(p[0], q[0], c)
502 // amd64:"SBBQ",-"NEGL",-"NEGQ"
503 // arm64:"SBCS",-"NEGS",-"NGC",-"NEG",-"ADD",-"SUB",-"CMP"
505 r[1], c = bits.Sub(p[1], q[1], c)
506 r[2], c = bits.Sub(p[2], q[2], c)
509 func Sub64(x, y, ci uint64) (r, co uint64) {
510 // amd64:"NEGL","SBBQ","NEGQ"
511 // arm64:"NEGS","SBCS","NGC","NEG",-"ADD",-"SUB",-"CMP"
513 return bits.Sub64(x, y, ci)
516 func Sub64C(x, ci uint64) (r, co uint64) {
517 // amd64:"NEGL","SBBQ","NEGQ"
518 // arm64:"NEGS","SBCS","NGC","NEG",-"ADD",-"SUB",-"CMP"
520 return bits.Sub64(x, 7, ci)
523 func Sub64Z(x, y uint64) (r, co uint64) {
524 // amd64:"SUBQ","SBBQ","NEGQ",-"NEGL"
525 // arm64:"SUBS","NGC","NEG",-"SBCS",-"ADD",-"SUB\t",-"CMP"
527 return bits.Sub64(x, y, 0)
530 func Sub64R(x, y, ci uint64) uint64 {
531 // amd64:"NEGL","SBBQ",-"NEGQ"
532 // arm64:"NEGS","SBCS",-"NGC",-"NEG\t",-"ADD",-"SUB",-"CMP"
534 r, _ := bits.Sub64(x, y, ci)
537 func Sub64M(p, q, r *[3]uint64) {
539 r[0], c = bits.Sub64(p[0], q[0], c)
540 // amd64:"SBBQ",-"NEGL",-"NEGQ"
541 // arm64:"SBCS",-"NEGS",-"NGC",-"NEG",-"ADD",-"SUB",-"CMP"
543 r[1], c = bits.Sub64(p[1], q[1], c)
544 r[2], c = bits.Sub64(p[2], q[2], c)
547 // --------------- //
549 // --------------- //
551 func Mul(x, y uint) (hi, lo uint) {
553 // arm64:"UMULH","MUL"
554 // ppc64:"MULHDU","MULLD"
555 // ppc64le:"MULHDU","MULLD"
556 return bits.Mul(x, y)
559 func Mul64(x, y uint64) (hi, lo uint64) {
561 // arm64:"UMULH","MUL"
562 // ppc64:"MULHDU","MULLD"
563 // ppc64le:"MULHDU","MULLD"
564 return bits.Mul64(x, y)
567 // --------------- //
569 // --------------- //
571 func Div(hi, lo, x uint) (q, r uint) {
573 return bits.Div(hi, lo, x)
576 func Div32(hi, lo, x uint32) (q, r uint32) {
577 // arm64:"ORR","UDIV","MSUB",-"UREM"
578 return bits.Div32(hi, lo, x)
581 func Div64(hi, lo, x uint64) (q, r uint64) {
583 return bits.Div64(hi, lo, x)
586 func Div64degenerate(x uint64) (q, r uint64) {
588 return bits.Div64(0, x, 5)