^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 1) ;; SPDX-License-Identifier: GPL-2.0-or-later
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 2) ;; Copyright (C) 2010 Texas Instruments Incorporated
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 3) ;; Contributed by Mark Salter <msalter@redhat.com>.
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 4) ;;
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 5)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 6) #include <linux/linkage.h>
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 7)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 8) ;; uint64_t __c6xabi_mpyll(uint64_t x, uint64_t y)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 9) ;;
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 10) ;; 64x64 multiply
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 11) ;; First compute partial results using 32-bit parts of x and y:
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 12) ;;
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 13) ;; b63 b32 b31 b0
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 14) ;; -----------------------------
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 15) ;; | 1 | 0 |
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 16) ;; -----------------------------
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 17) ;;
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 18) ;; P0 = X0*Y0
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 19) ;; P1 = X0*Y1 + X1*Y0
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 20) ;; P2 = X1*Y1
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 21) ;;
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 22) ;; result = (P2 << 64) + (P1 << 32) + P0
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 23) ;;
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 24) ;; Since the result is also 64-bit, we can skip the P2 term.
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 25)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 26) .text
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 27) ENTRY(__c6xabi_mpyll) ; x in A5:A4 (X1:X0), y in B5:B4 (Y1:Y0); 64-bit product is written back to A5:A4
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 28) mpy32u .m1x A4,B4,A1:A0 ; A1:A0 = X0*Y0 (P0, both 32-bit halves are used below)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 29) b .s2 B3 ; branch to the address in B3 (presumably the caller's return address); issued early, the instructions below still execute - NOTE(review): relies on branch delay slots, confirm against the C6x ISA guide
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 30) || mpy32u .m2x B5,A4,B1:B0 ; B1:B0 = X0*Y1, in parallel with the branch (don't need upper 32-bits, only B0 is read)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 31) || mpy32u .m1x A5,B4,A3:A2 ; A3:A2 = X1*Y0, in parallel with the branch (don't need upper 32-bits, only A2 is read)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 32) nop ; presumably waits for the first multiply result (A1:A0) - do not remove without re-checking mpy32u latency
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 33) nop ; second wait cycle; A0 is first read by the next instruction
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 34) mv .s1 A0,A4 ; result low word: A4 = low 32 bits of P0
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 35) add .l1x A2,B0,A5 ; A5 = low32(X1*Y0) + low32(X0*Y1) = low 32 bits of P1
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 36) add .s1 A1,A5,A5 ; result high word: A5 = high 32 bits of P0 + low 32 bits of P1 (carries out of bit 63 are discarded)
^8f3ce5b39 (kx 2023-10-28 12:00:06 +0300 37) ENDPROC(__c6xabi_mpyll)