VirtualBox

source: vbox/trunk/src/VBox/Runtime/common/asm/ASMMultU64ByU32DivByU32.asm@ 93115

Last change on this file since 93115 was 93115, checked in by vboxsync, 3 years ago

scm --update-copyright-year

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 4.5 KB
Line 
1; $Id: ASMMultU64ByU32DivByU32.asm 93115 2022-01-01 11:31:46Z vboxsync $
2;; @file
3; IPRT - Assembly Functions, ASMMultU64ByU32DivByU32.
4;
5
6;
7; Copyright (C) 2006-2022 Oracle Corporation
8;
9; This file is part of VirtualBox Open Source Edition (OSE), as
10; available from http://www.virtualbox.org. This file is free software;
11; you can redistribute it and/or modify it under the terms of the GNU
12; General Public License (GPL) as published by the Free Software
13; Foundation, in version 2 as it comes in the "COPYING" file of the
14; VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15; hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16;
17; The contents of this file may alternatively be used under the terms
18; of the Common Development and Distribution License Version 1.0
19; (CDDL) only, as it comes in the "COPYING.CDDL" file of the
20; VirtualBox OSE distribution, in which case the provisions of the
21; CDDL are applicable instead of those of the GPL.
22;
23; You may elect to license modified versions of this file under the
24; terms and conditions of either the GPL or the CDDL or both.
25;
26
27%include "iprt/asmdefs.mac"
28
29
30;;
31; Multiple a 64-bit by a 32-bit integer and divide the result by a 32-bit integer
32; using a 96 bit intermediate result.
33;
34; @returns (u64A * u32B) / u32C.
35; @param u64A/rcx/rdi The 64-bit value.
36; @param u32B/edx/esi The 32-bit value to multiple by A.
37; @param u32C/r8d/edx The 32-bit value to divide A*B by.
38;
39; @cproto DECLASM(uint64_t) ASMMultU64ByU32DivByU32(uint64_t u64A, uint32_t u32B, uint32_t u32C);
40;
41RT_BEGINPROC ASMMultU64ByU32DivByU32
42%if ARCH_BITS == 64
43
44 %ifdef ASM_CALL64_MSC
45 mov rax, rcx ; rax = u64A
46 mov r9d, edx ; should check the specs wrt to the high bits one day...
47 mov r8d, r8d ; be paranoid for the time being.
48 %else
49 mov rax, rdi ; rax = u64A
50 mov r9d, esi ; r9d = u32B
51 mov r8d, edx ; r8d = u32C
52 %endif
53 mul r9
54 div r8
55
56%else ; 16 or 32 bit
57 ;
58 ; This implementation is converted from the GCC inline
59 ; version of the code. Nothing additional has been done
60 ; performance wise.
61 ;
62 %if ARCH_BITS == 16
63 push bp
64 mov bp, sp
65 push eax ; push all return registers to preserve high value (paranoia)
66 push ebx
67 push ecx
68 push edx
69 %endif
70 push esi
71 push edi
72
73 %if ARCH_BITS == 16
74 %define u64A_Lo [bp + 4 + 04h]
75 %define u64A_Hi [bp + 4 + 08h]
76 %define u32B [bp + 4 + 0ch]
77 %define u32C [bp + 4 + 10h]
78 %else
79 %define u64A_Lo [esp + 04h + 08h]
80 %define u64A_Hi [esp + 08h + 08h]
81 %define u32B [esp + 0ch + 08h]
82 %define u32C [esp + 10h + 08h]
83 %endif
84
85 ; Load parameters into registers.
86 mov eax, u64A_Lo
87 mov esi, u64A_Hi
88 mov ecx, u32B
89 mov edi, u32C
90
91 ; The body, just like the in
92 mul ecx ; eax = u64Lo.lo = (u64A.lo * u32B).lo
93 ; edx = u64Lo.hi = (u64A.lo * u32B).hi
94 xchg eax, esi ; esi = u64Lo.lo
95 ; eax = u64A.hi
96 xchg edx, edi ; edi = u64Low.hi
97 ; edx = u32C
98 xchg edx, ecx ; ecx = u32C
99 ; edx = u32B
100 mul edx ; eax = u64Hi.lo = (u64A.hi * u32B).lo
101 ; edx = u64Hi.hi = (u64A.hi * u32B).hi
102 add eax, edi ; u64Hi.lo += u64Lo.hi
103 adc edx, 0 ; u64Hi.hi += carry
104 div ecx ; eax = u64Hi / u32C
105 ; edx = u64Hi % u32C
106 mov edi, eax ; edi = u64Result.hi = u64Hi / u32C
107 mov eax, esi ; eax = u64Lo.lo
108 div ecx ; u64Result.lo
109 mov edx, edi ; u64Result.hi
110
111 ; epilogue
112 pop edi
113 pop esi
114 %if ARCH_BITS == 16
115 ; DX:CX:BX:AX, where DX holds bits 15:0, CX bits 31:16, BX bits 47:32, and AX bits 63:48.
116 mov ax, [bp - 4*4] ; dx = bits 15:0
117 shr eax, 16
118 mov ax, [bp - 3*4] ; cx = bits 31:16
119 mov dx, [bp - 2*4] ; bx = bits 47:32
120 shr edx, 16
121 mov dx, [bp - 1*4] ; ax = bits 63:48
122 pop edx
123 pop ecx
124 pop ebx
125 pop eax
126 leave
127 %endif
128%endif
129 ret
130ENDPROC ASMMultU64ByU32DivByU32
131
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette