-
Notifications
You must be signed in to change notification settings - Fork 129
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge pull request #4266 from pmatos/FSTOpt
x87 fst/fld optimization for different addrmodes
- Loading branch information
Showing
19 changed files
with
29,927 additions
and
2,643 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,44 @@ | ||
%ifdef CONFIG | ||
{ | ||
"RegData": { | ||
"RAX": "0x3f800000", | ||
"RBX": "0x3f800000", | ||
"RCX": "0x3f800000", | ||
"RBP": "0x3f800000", | ||
"RDI": "0x3f800000", | ||
"RSP": "0x3f800000" | ||
}, | ||
"MemoryRegions": { | ||
"0xf0000000": "4096" | ||
}, | ||
"Mode": "32BIT" | ||
} | ||
%endif | ||
|
||
; Purpose: store ST0 with `fst dword` through six addressing forms | ||
; (base, base+disp, base+index, base+index*scale, base+index+disp, | ||
; base+index*scale+disp) and read every slot back with an integer load. | ||
; Scratch buffer: 4096 bytes. The highest byte touched below is at offset | ||
; 0x64*4 + 0xa + 3 = 413, so every access stays inside the buffer. | ||
section .bss | ||
base resb 4096 | ||
|
||
section .text | ||
|
||
; Setup | ||
; fld1 pushes +1.0 onto the x87 stack, edx holds the buffer address and | ||
; esi = 0x64 is the index register used by the indexed forms. | ||
; NOTE(review): the config header above selects 32BIT mode; confirm how the | ||
; assembler treats the `rel` keyword in that mode. | ||
fld1 | ||
lea edx, [rel base] | ||
mov esi, 0x64 | ||
|
||
; Test fst | ||
; fst does not pop, so the same ST0 value is written six times. | ||
; Slot offsets in order: 0, 10, 100, 400, 110, 410 (4 bytes each, no overlap). | ||
fst dword [edx] | ||
fst dword [edx + 0xa] | ||
fst dword [edx + esi] | ||
fst dword [edx + esi * 4] | ||
fst dword [edx + esi + 0xa] | ||
fst dword [edx + esi * 4 + 0xa] | ||
|
||
; Result check | ||
; Each load mirrors the addressing form of one store above. 0x3f800000 in the | ||
; config header is 1.0 encoded as an IEEE-754 single; presumably the harness | ||
; compares the final register state against those values. | ||
; The last load overwrites esp; only hlt follows, so nothing uses the stack. | ||
mov eax, dword [edx] | ||
mov ebx, dword [edx + 0xa] | ||
mov ecx, dword [edx + esi] | ||
mov ebp, dword [edx + esi * 4] | ||
mov edi, dword [edx + esi + 0xa] | ||
mov esp, dword [edx + esi * 4 + 0xa] | ||
|
||
hlt |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,25 @@ | ||
%ifdef CONFIG | ||
{ | ||
"RegData": { | ||
"MM7": ["0x8000000000000000", "0x4000"] | ||
} | ||
} | ||
%endif | ||
|
||
; Purpose: round-trip an 80-bit value through memory. 2.0 is loaded from | ||
; `data`, stored-and-popped to `data2` through rax, then reloaded through rdx. | ||
; `8 * 0` evaluates to 0, so every memory operand here is a plain [reg] access. | ||
lea rdx, [rel data] | ||
fld tword [rdx + 8 * 0] | ||
|
||
; rax is derived from rdx with lea, so the store via rax and the reload via | ||
; rdx address the same 10 bytes at `data2`. | ||
lea rdx, [rel data2] | ||
lea rax, [rdx + 8 * 0] | ||
fstp tword [rax] | ||
fld tword [rdx + 8 * 0] | ||
|
||
; The config header above expects MM7 = [0x8000000000000000, 0x4000], which is | ||
; 2.0 in x87 extended precision (significand with explicit integer bit, | ||
; biased exponent 0x3fff + 1); presumably checked by the harness after hlt. | ||
hlt | ||
|
||
; Test data. Each record is a 10-byte `dt` followed by an 8-byte `dq` pad, so | ||
; `data2` begins 18 bytes after `data`; only `data` itself is 8-byte aligned. | ||
; NOTE(review): no section directive is visible in this file, so `data2` | ||
; (written by fstp above) presumably shares a section with the code - confirm | ||
; that the harness maps it writable. | ||
align 8 | ||
data: | ||
dt 2.0 | ||
dq 0 | ||
data2: | ||
dt 0.0 | ||
dq 0 |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,43 @@ | ||
%ifdef CONFIG | ||
{ | ||
"RegData": { | ||
"RAX": "0x3f800000", | ||
"RBX": "0x3f800000", | ||
"RCX": "0x3f800000", | ||
"R8": "0x3f800000", | ||
"R9": "0x3f800000", | ||
"R10": "0x3f800000" | ||
}, | ||
"MemoryRegions": { | ||
"0x100000000": "4096" | ||
} | ||
} | ||
%endif | ||
|
||
; Purpose: store ST0 with `fst dword` through six 64-bit addressing forms | ||
; (base, base+disp, base+index, base+index*scale, base+index+disp, | ||
; base+index*scale+disp) and read every slot back with an integer load. | ||
; Scratch buffer: 4096 bytes. The highest byte touched below is at offset | ||
; 0x64*4 + 0xa + 3 = 413, so every access stays inside the buffer. | ||
section .bss | ||
base resb 4096 | ||
|
||
section .text | ||
|
||
; Setup | ||
; fld1 pushes +1.0 onto the x87 stack, rdx holds the RIP-relative address of | ||
; the buffer and rsi = 0x64 is the index register used by the indexed forms. | ||
fld1 | ||
lea rdx, [rel base] | ||
mov rsi, 0x64 | ||
|
||
; Test fst | ||
; fst does not pop, so the same ST0 value is written six times. | ||
; Slot offsets in order: 0, 10, 100, 400, 110, 410 (4 bytes each, no overlap). | ||
fst dword [rdx] | ||
fst dword [rdx + 0xa] | ||
fst dword [rdx + rsi] | ||
fst dword [rdx + rsi * 4] | ||
fst dword [rdx + rsi + 0xa] | ||
fst dword [rdx + rsi * 4 + 0xa] | ||
|
||
; Result check | ||
; Each load mirrors the addressing form of one store above. The destinations | ||
; are 32-bit registers, so the upper halves of the 64-bit registers are | ||
; zeroed, matching the 0x3f800000 (1.0 as an IEEE-754 single) values listed in | ||
; the config header; presumably the harness compares final register state. | ||
mov eax, dword [rdx] | ||
mov ebx, dword [rdx + 0xa] | ||
mov ecx, dword [rdx + rsi] | ||
mov r8d, dword [rdx + rsi * 4] | ||
mov r9d, dword [rdx + rsi + 0xa] | ||
mov r10d, dword [rdx + rsi * 4 + 0xa] | ||
|
||
hlt |
Oops, something went wrong.