mirror of
https://git.wownero.com/wownero/RandomWOW.git
synced 2024-12-22 07:48:54 +00:00
Use values from configuration.h in assembly code
This commit is contained in:
parent
03dd2f397f
commit
c1314dc2a2
2
makefile
2
makefile
@ -88,7 +88,7 @@ $(OBJDIR)/jit_compiler_x86.o: $(SRCDIR)/jit_compiler_x86.cpp $(SRCDIR)/jit_compi
|
|||||||
$(SRCDIR)/superscalar_program.hpp $(SRCDIR)/instruction.hpp $(SRCDIR)/blake2_generator.hpp \
|
$(SRCDIR)/superscalar_program.hpp $(SRCDIR)/instruction.hpp $(SRCDIR)/blake2_generator.hpp \
|
||||||
$(SRCDIR)/program.hpp $(SRCDIR)/reciprocal.h $(SRCDIR)/virtual_memory.hpp \
|
$(SRCDIR)/program.hpp $(SRCDIR)/reciprocal.h $(SRCDIR)/virtual_memory.hpp \
|
||||||
$(SRCDIR)/instruction_weights.hpp
|
$(SRCDIR)/instruction_weights.hpp
|
||||||
$(OBJDIR)/jit_compiler_x86_static.o: $(SRCDIR)/jit_compiler_x86_static.S \
|
$(OBJDIR)/jit_compiler_x86_static.o: $(SRCDIR)/jit_compiler_x86_static.S $(SRCDIR)/configuration.h \
|
||||||
$(SRCDIR)/asm/program_prologue_linux.inc $(SRCDIR)/asm/program_xmm_constants.inc \
|
$(SRCDIR)/asm/program_prologue_linux.inc $(SRCDIR)/asm/program_xmm_constants.inc \
|
||||||
$(SRCDIR)/asm/program_loop_load.inc $(SRCDIR)/asm/program_read_dataset.inc \
|
$(SRCDIR)/asm/program_loop_load.inc $(SRCDIR)/asm/program_read_dataset.inc \
|
||||||
$(SRCDIR)/asm/program_read_dataset_sshash_init.inc \
|
$(SRCDIR)/asm/program_read_dataset_sshash_init.inc \
|
||||||
|
49
src/asm/configuration.asm
Normal file
49
src/asm/configuration.asm
Normal file
@ -0,0 +1,49 @@
|
|||||||
|
; File start: ..\src\configuration.h
|
||||||
|
RANDOMX_ARGON_MEMORY EQU 262144t
|
||||||
|
RANDOMX_ARGON_ITERATIONS EQU 3t
|
||||||
|
RANDOMX_ARGON_LANES EQU 1t
|
||||||
|
RANDOMX_ARGON_SALT TEXTEQU <"RandomX\x03">
|
||||||
|
RANDOMX_CACHE_ACCESSES EQU 8t
|
||||||
|
RANDOMX_SUPERSCALAR_LATENCY EQU 170t
|
||||||
|
RANDOMX_SUPERSCALAR_MAX_SIZE EQU 512t
|
||||||
|
RANDOMX_DATASET_BASE_SIZE EQU 2147483648t
|
||||||
|
RANDOMX_DATASET_EXTRA_SIZE EQU 33554368t
|
||||||
|
RANDOMX_PROGRAM_SIZE EQU 256t
|
||||||
|
RANDOMX_PROGRAM_ITERATIONS EQU 2048t
|
||||||
|
RANDOMX_PROGRAM_COUNT EQU 8t
|
||||||
|
RANDOMX_SCRATCHPAD_L3 EQU 2097152t
|
||||||
|
RANDOMX_SCRATCHPAD_L2 EQU 262144t
|
||||||
|
RANDOMX_SCRATCHPAD_L1 EQU 16384t
|
||||||
|
RANDOMX_JUMP_BITS EQU 8t
|
||||||
|
RANDOMX_JUMP_OFFSET EQU 8t
|
||||||
|
RANDOMX_FREQ_IADD_RS EQU 25t
|
||||||
|
RANDOMX_FREQ_IADD_M EQU 7t
|
||||||
|
RANDOMX_FREQ_ISUB_R EQU 16t
|
||||||
|
RANDOMX_FREQ_ISUB_M EQU 7t
|
||||||
|
RANDOMX_FREQ_IMUL_R EQU 16t
|
||||||
|
RANDOMX_FREQ_IMUL_M EQU 4t
|
||||||
|
RANDOMX_FREQ_IMULH_R EQU 4t
|
||||||
|
RANDOMX_FREQ_IMULH_M EQU 1t
|
||||||
|
RANDOMX_FREQ_ISMULH_R EQU 4t
|
||||||
|
RANDOMX_FREQ_ISMULH_M EQU 1t
|
||||||
|
RANDOMX_FREQ_IMUL_RCP EQU 8t
|
||||||
|
RANDOMX_FREQ_INEG_R EQU 2t
|
||||||
|
RANDOMX_FREQ_IXOR_R EQU 15t
|
||||||
|
RANDOMX_FREQ_IXOR_M EQU 5t
|
||||||
|
RANDOMX_FREQ_IROR_R EQU 10t
|
||||||
|
RANDOMX_FREQ_IROL_R EQU 0t
|
||||||
|
RANDOMX_FREQ_ISWAP_R EQU 4t
|
||||||
|
RANDOMX_FREQ_FSWAP_R EQU 8t
|
||||||
|
RANDOMX_FREQ_FADD_R EQU 20t
|
||||||
|
RANDOMX_FREQ_FADD_M EQU 5t
|
||||||
|
RANDOMX_FREQ_FSUB_R EQU 20t
|
||||||
|
RANDOMX_FREQ_FSUB_M EQU 5t
|
||||||
|
RANDOMX_FREQ_FSCAL_R EQU 6t
|
||||||
|
RANDOMX_FREQ_FMUL_R EQU 20t
|
||||||
|
RANDOMX_FREQ_FDIV_M EQU 4t
|
||||||
|
RANDOMX_FREQ_FSQRT_R EQU 6t
|
||||||
|
RANDOMX_FREQ_CBRANCH EQU 16t
|
||||||
|
RANDOMX_FREQ_CFROUND EQU 1t
|
||||||
|
RANDOMX_FREQ_ISTORE EQU 16t
|
||||||
|
RANDOMX_FREQ_NOP EQU 0t
|
||||||
|
; File end: ..\src\configuration.h
|
@ -1,5 +1,5 @@
|
|||||||
mov rdx, rax
|
mov rdx, rax
|
||||||
and eax, 2097088
|
and eax, RANDOMX_SCRATCHPAD_MASK
|
||||||
lea rcx, [rsi+rax]
|
lea rcx, [rsi+rax]
|
||||||
push rcx
|
push rcx
|
||||||
xor r8, qword ptr [rcx+0]
|
xor r8, qword ptr [rcx+0]
|
||||||
@ -11,7 +11,7 @@
|
|||||||
xor r14, qword ptr [rcx+48]
|
xor r14, qword ptr [rcx+48]
|
||||||
xor r15, qword ptr [rcx+56]
|
xor r15, qword ptr [rcx+56]
|
||||||
ror rdx, 32
|
ror rdx, 32
|
||||||
and edx, 2097088
|
and edx, RANDOMX_SCRATCHPAD_MASK
|
||||||
lea rcx, [rsi+rdx]
|
lea rcx, [rsi+rdx]
|
||||||
push rcx
|
push rcx
|
||||||
cvtdq2pd xmm0, qword ptr [rcx+0]
|
cvtdq2pd xmm0, qword ptr [rcx+0]
|
||||||
|
@ -1,10 +1,10 @@
|
|||||||
xor rbp, rax ;# modify "mx"
|
xor rbp, rax ;# modify "mx"
|
||||||
mov edx, ebp ;# edx = mx
|
mov edx, ebp ;# edx = mx
|
||||||
and edx, 2147483584 ;# align "mx" to the start of a cache line
|
and edx, RANDOMX_DATASET_BASE_MASK
|
||||||
prefetchnta byte ptr [rdi+rdx]
|
prefetchnta byte ptr [rdi+rdx]
|
||||||
ror rbp, 32 ;# swap "ma" and "mx"
|
ror rbp, 32 ;# swap "ma" and "mx"
|
||||||
mov edx, ebp ;# edx = ma
|
mov edx, ebp ;# edx = ma
|
||||||
and edx, 2147483584 ;# align "ma" to the start of a cache line
|
and edx, RANDOMX_DATASET_BASE_MASK
|
||||||
lea rcx, [rdi+rdx] ;# dataset cache line
|
lea rcx, [rdi+rdx] ;# dataset cache line
|
||||||
xor r8, qword ptr [rcx+0]
|
xor r8, qword ptr [rcx+0]
|
||||||
xor r9, qword ptr [rcx+8]
|
xor r9, qword ptr [rcx+8]
|
||||||
|
@ -11,7 +11,7 @@
|
|||||||
xor rbp, rax ;# modify "mx"
|
xor rbp, rax ;# modify "mx"
|
||||||
ror rbp, 32 ;# swap "ma" and "mx"
|
ror rbp, 32 ;# swap "ma" and "mx"
|
||||||
mov ebx, ebp ;# ecx = ma
|
mov ebx, ebp ;# ecx = ma
|
||||||
and ebx, 2147483584 ;# align "ma" to the start of a cache line
|
and ebx, RANDOMX_DATASET_BASE_MASK
|
||||||
shr ebx, 6 ;# ebx = Dataset block number
|
shr ebx, 6 ;# ebx = Dataset block number
|
||||||
;# add ebx, datasetOffset / 64
|
;# add ebx, datasetOffset / 64
|
||||||
;# call 32768
|
;# call 32768
|
@ -1,4 +1,4 @@
|
|||||||
and rbx, 4194303
|
and rbx, RANDOMX_CACHE_MASK
|
||||||
shl rbx, 6
|
shl rbx, 6
|
||||||
add rbx, rdi
|
add rbx, rdi
|
||||||
prefetchnta byte ptr [rbx]
|
prefetchnta byte ptr [rbx]
|
@ -20,7 +20,7 @@ along with RandomX. If not, see<http://www.gnu.org/licenses/>.
|
|||||||
#pragma once
|
#pragma once
|
||||||
|
|
||||||
//Cache size in KiB. Must be a power of 2.
|
//Cache size in KiB. Must be a power of 2.
|
||||||
#define RANDOMX_ARGON_MEMORY (256 * 1024)
|
#define RANDOMX_ARGON_MEMORY 262144
|
||||||
|
|
||||||
//Number of Argon2d iterations for Cache initialization
|
//Number of Argon2d iterations for Cache initialization
|
||||||
#define RANDOMX_ARGON_ITERATIONS 3
|
#define RANDOMX_ARGON_ITERATIONS 3
|
||||||
@ -41,7 +41,7 @@ along with RandomX. If not, see<http://www.gnu.org/licenses/>.
|
|||||||
#define RANDOMX_SUPERSCALAR_MAX_SIZE 512
|
#define RANDOMX_SUPERSCALAR_MAX_SIZE 512
|
||||||
|
|
||||||
//Dataset base size in bytes. Must be a power of 2.
|
//Dataset base size in bytes. Must be a power of 2.
|
||||||
#define RANDOMX_DATASET_BASE_SIZE (2ULL * 1024 * 1024 * 1024)
|
#define RANDOMX_DATASET_BASE_SIZE 2147483648
|
||||||
|
|
||||||
//Dataset extra size. Must be divisible by 64.
|
//Dataset extra size. Must be divisible by 64.
|
||||||
#define RANDOMX_DATASET_EXTRA_SIZE 33554368
|
#define RANDOMX_DATASET_EXTRA_SIZE 33554368
|
||||||
@ -56,13 +56,13 @@ along with RandomX. If not, see<http://www.gnu.org/licenses/>.
|
|||||||
#define RANDOMX_PROGRAM_COUNT 8
|
#define RANDOMX_PROGRAM_COUNT 8
|
||||||
|
|
||||||
//Scratchpad L3 size in bytes. Must be a power of 2.
|
//Scratchpad L3 size in bytes. Must be a power of 2.
|
||||||
#define RANDOMX_SCRATCHPAD_L3 (2 * 1024 * 1024)
|
#define RANDOMX_SCRATCHPAD_L3 2097152
|
||||||
|
|
||||||
//Scratchpad L2 size in bytes. Must be a power of two and less than or equal to RANDOMX_SCRATCHPAD_L3.
|
//Scratchpad L2 size in bytes. Must be a power of two and less than or equal to RANDOMX_SCRATCHPAD_L3.
|
||||||
#define RANDOMX_SCRATCHPAD_L2 (256 * 1024)
|
#define RANDOMX_SCRATCHPAD_L2 262144
|
||||||
|
|
||||||
//Scratchpad L1 size in bytes. Must be a power of two and less than or equal to RANDOMX_SCRATCHPAD_L2.
|
//Scratchpad L1 size in bytes. Must be a power of two and less than or equal to RANDOMX_SCRATCHPAD_L2.
|
||||||
#define RANDOMX_SCRATCHPAD_L1 (16 * 1024)
|
#define RANDOMX_SCRATCHPAD_L1 16384
|
||||||
|
|
||||||
//Jump condition mask size in bits.
|
//Jump condition mask size in bits.
|
||||||
#define RANDOMX_JUMP_BITS 8
|
#define RANDOMX_JUMP_BITS 8
|
||||||
|
@ -44,6 +44,12 @@
|
|||||||
.global DECL(randomx_program_end)
|
.global DECL(randomx_program_end)
|
||||||
.global DECL(randomx_reciprocal_fast)
|
.global DECL(randomx_reciprocal_fast)
|
||||||
|
|
||||||
|
#include "configuration.h"
|
||||||
|
|
||||||
|
#define RANDOMX_SCRATCHPAD_MASK (RANDOMX_SCRATCHPAD_L3-64)
|
||||||
|
#define RANDOMX_DATASET_BASE_MASK (RANDOMX_DATASET_BASE_SIZE-64)
|
||||||
|
#define RANDOMX_CACHE_MASK (RANDOMX_ARGON_MEMORY*16-1)
|
||||||
|
|
||||||
#define db .byte
|
#define db .byte
|
||||||
|
|
||||||
.balign 64
|
.balign 64
|
||||||
|
@ -37,6 +37,12 @@ PUBLIC randomx_sshash_init
|
|||||||
PUBLIC randomx_program_end
|
PUBLIC randomx_program_end
|
||||||
PUBLIC randomx_reciprocal_fast
|
PUBLIC randomx_reciprocal_fast
|
||||||
|
|
||||||
|
include asm/configuration.asm
|
||||||
|
|
||||||
|
RANDOMX_SCRATCHPAD_MASK EQU (RANDOMX_SCRATCHPAD_L3-64)
|
||||||
|
RANDOMX_DATASET_BASE_MASK EQU (RANDOMX_DATASET_BASE_SIZE-64)
|
||||||
|
RANDOMX_CACHE_MASK EQU (RANDOMX_ARGON_MEMORY*16-1)
|
||||||
|
|
||||||
ALIGN 64
|
ALIGN 64
|
||||||
randomx_program_prologue PROC
|
randomx_program_prologue PROC
|
||||||
include asm/program_prologue_win64.inc
|
include asm/program_prologue_win64.inc
|
||||||
|
90
vcxproj/h2inc.ps1
Normal file
90
vcxproj/h2inc.ps1
Normal file
@ -0,0 +1,90 @@
|
|||||||
|
# The MIT License (MIT)
|
||||||
|
#
|
||||||
|
# Copyright (c) .NET Foundation and Contributors
|
||||||
|
#
|
||||||
|
# All rights reserved.
|
||||||
|
#
|
||||||
|
# Permission is hereby granted, free of charge, to any person obtaining a copy
|
||||||
|
# of this software and associated documentation files (the "Software"), to deal
|
||||||
|
# in the Software without restriction, including without limitation the rights
|
||||||
|
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
||||||
|
# copies of the Software, and to permit persons to whom the Software is
|
||||||
|
# furnished to do so, subject to the following conditions:
|
||||||
|
#
|
||||||
|
# The above copyright notice and this permission notice shall be included in all
|
||||||
|
# copies or substantial portions of the Software.
|
||||||
|
#
|
||||||
|
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
||||||
|
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
||||||
|
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
||||||
|
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
||||||
|
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
||||||
|
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
||||||
|
# SOFTWARE.
|
||||||
|
|
||||||
|
# C to MASM include file translator
|
||||||
|
# This is replacement for the deprecated h2inc tool that used to be part of VS.
|
||||||
|
|
||||||
|
#
|
||||||
|
# The use of [console]::WriteLine (instead of Write-Output) is intentional.
|
||||||
|
# PowerShell 2.0 (installed by default on Windows 7) wraps lines written with
|
||||||
|
# Write-Output at whatever column width is being used by the current terminal,
|
||||||
|
# even when output is being redirected to a file. We can't have this behavior
|
||||||
|
# because it will cause the generated file to be malformed.
|
||||||
|
#
|
||||||
|
|
||||||
|
Function ProcessFile($filePath) {
|
||||||
|
|
||||||
|
[console]::WriteLine("; File start: $filePath")
|
||||||
|
|
||||||
|
Get-Content $filePath | ForEach-Object {
|
||||||
|
|
||||||
|
if ($_ -match "^\s*#\spragma") {
|
||||||
|
# Ignore pragmas
|
||||||
|
return
|
||||||
|
}
|
||||||
|
|
||||||
|
if ($_ -match "^\s*#\s*include\s*`"(.*)`"")
|
||||||
|
{
|
||||||
|
# Expand includes.
|
||||||
|
ProcessFile(Join-Path (Split-Path -Parent $filePath) $Matches[1])
|
||||||
|
return
|
||||||
|
}
|
||||||
|
|
||||||
|
if ($_ -match "^\s*#define\s+(\S+)\s*(.*)")
|
||||||
|
{
|
||||||
|
# Augment #defines with their MASM equivalent
|
||||||
|
$name = $Matches[1]
|
||||||
|
$value = $Matches[2]
|
||||||
|
|
||||||
|
# Note that we do not handle multiline constants
|
||||||
|
|
||||||
|
# Strip comments from value
|
||||||
|
$value = $value -replace "//.*", ""
|
||||||
|
$value = $value -replace "/\*.*\*/", ""
|
||||||
|
|
||||||
|
# Strip whitespaces from value
|
||||||
|
$value = $value -replace "\s+$", ""
|
||||||
|
|
||||||
|
# ignore #defines with arguments
|
||||||
|
if ($name -notmatch "\(") {
|
||||||
|
$HEX_NUMBER_PATTERN = "\b0x(\w+)\b"
|
||||||
|
$DECIMAL_NUMBER_PATTERN = "(-?\b\d+\b)"
|
||||||
|
|
||||||
|
if ($value -match $HEX_NUMBER_PATTERN -or $value -match $DECIMAL_NUMBER_PATTERN) {
|
||||||
|
$value = $value -replace $HEX_NUMBER_PATTERN, "0`$1h" # Convert hex constants
|
||||||
|
$value = $value -replace $DECIMAL_NUMBER_PATTERN, "`$1t" # Convert dec constants
|
||||||
|
[console]::WriteLine("$name EQU $value")
|
||||||
|
} else {
|
||||||
|
[console]::WriteLine("$name TEXTEQU <$value>")
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
# [console]::WriteLine("$_")
|
||||||
|
}
|
||||||
|
|
||||||
|
[console]::WriteLine("; File end: $filePath")
|
||||||
|
}
|
||||||
|
|
||||||
|
ProcessFile $args[0]
|
@ -122,6 +122,10 @@
|
|||||||
</AdditionalOptions>
|
</AdditionalOptions>
|
||||||
<StackReserveSize>4194304</StackReserveSize>
|
<StackReserveSize>4194304</StackReserveSize>
|
||||||
</Link>
|
</Link>
|
||||||
|
<PreBuildEvent>
|
||||||
|
<Command>powershell -ExecutionPolicy Bypass -File .\h2inc.ps1 ..\src\configuration.h > ..\src\asm\configuration.asm
|
||||||
|
SET ERRORLEVEL = 0</Command>
|
||||||
|
</PreBuildEvent>
|
||||||
</ItemDefinitionGroup>
|
</ItemDefinitionGroup>
|
||||||
<ItemGroup>
|
<ItemGroup>
|
||||||
<ClCompile Include="..\src\allocator.cpp" />
|
<ClCompile Include="..\src\allocator.cpp" />
|
||||||
|
Loading…
Reference in New Issue
Block a user