1
0

add load uop tests

This commit is contained in:
Rokas Puzonas 2024-02-15 21:03:11 +02:00
parent 42d36ea3fb
commit 01c6e51e6a
6 changed files with 110 additions and 4 deletions

View File

@ -1,8 +1,11 @@
CFLAGS=-lm -g -Wall -O1
build/main: src/main.c src/repetition_tester.c build/multi_nop_loop.o build/write_loops.o src/rprof.h
build/main: src/main.c src/repetition_tester.c build/multi_nop_loop.o build/write_loops.o build/load_uop.o src/rprof.h
mkdir -p build
gcc -o build/main src/main.c build/multi_nop_loop.o build/write_loops.o $(CFLAGS)
gcc -o build/main src/main.c build/multi_nop_loop.o build/write_loops.o build/load_uop.o $(CFLAGS)
build/load_uop.o: src/load_uop.asm
nasm -g -f elf64 -o build/load_uop.o src/load_uop.asm
build/write_loops.o: src/write_loops.asm
nasm -g -f elf64 -o build/write_loops.o src/write_loops.asm

56
src/load_uop.asm Normal file
View File

@ -0,0 +1,56 @@
global mov_load_x1
global mov_load_x2
global mov_load_x3
global mov_load_x4
section .text
; rsi - byte_count
; rdi - buffer
mov_load_x1:
mov rcx, rsi
align 64
.loop:
mov rax, [rdi]
sub rcx, 1
jnle .loop
ret
; rsi - byte_count
; rdi - buffer
mov_load_x2:
mov rcx, rsi
align 64
.loop:
mov rax, [rdi]
mov rax, [rdi]
sub rcx, 2
jnle .loop
ret
; rsi - byte_count
; rdi - buffer
mov_load_x3:
mov rcx, rsi
align 64
.loop:
mov rax, [rdi]
mov rax, [rdi]
mov rax, [rdi]
sub rcx, 3
jnle .loop
ret
; rsi - byte_count
; rdi - buffer
mov_load_x4:
mov rcx, rsi
align 64
.loop:
mov rax, [rdi]
mov rax, [rdi]
mov rax, [rdi]
mov rax, [rdi]
sub rcx, 4
jnle .loop
ret

6
src/load_uop.h Normal file
View File

@ -0,0 +1,6 @@
#include <stdint.h>
void mov_load_x1(uint8_t *buffer, uint64_t byte_count);
void mov_load_x2(uint8_t *buffer, uint64_t byte_count);
void mov_load_x3(uint8_t *buffer, uint64_t byte_count);
void mov_load_x4(uint8_t *buffer, uint64_t byte_count);

View File

@ -14,6 +14,7 @@
#include "main_malloc_read.c"
#include "main_write_backward.c"
#include "main_write_loop.c"
#include "main_load_uop.c"
int main(int argc, char **argv) {
if (argc < 2) {
@ -27,6 +28,8 @@ int main(int argc, char **argv) {
return main_test_write_bytes_asm();
} else if (!strncmp(test_name, "write_all_bytes", sizeof("write_bytes"))) {
return main_test_write_all_bytes();
} else if (!strncmp(test_name, "load_uop", sizeof("load_uop"))) {
return main_test_load_uop();
} else if (!strncmp(test_name, "write_loop", sizeof("write_loop"))) {
return main_test_write_loop();
} else if (!strncmp(test_name, "write_backward", sizeof("write_backward"))) {

40
src/main_load_uop.c Normal file
View File

@ -0,0 +1,40 @@
#include "repetition_tester.c"
#include "load_uop.h"
int main_test_load_uop() {
typedef void (*test_cb)(uint8_t *buffer, uint64_t byte_count);
struct testcase {
char *name;
test_cb cb;
};
struct testcase cases[] = {
{ .name = "mov_load_x1()", .cb = mov_load_x1 },
{ .name = "mov_load_x2()", .cb = mov_load_x2 },
{ .name = "mov_load_x3()", .cb = mov_load_x3 },
{ .name = "mov_load_x4()", .cb = mov_load_x4 },
};
struct repetitor repetitor = {};
repetitor_init(&repetitor);
printf("CPU Frequency: %ldHz (~%.2fGHz)\n", repetitor.cpu_freq, (float)repetitor.cpu_freq/(1000*1000*1000));
uint64_t byte_count = 4096 * 1024;
uint8_t buffer[byte_count];
for (int i = 0; i < ARRAY_LEN(cases); i++) {
struct testcase *testcase = &cases[i];
repetitor_clear(&repetitor);
while (repetitor_repeat(&repetitor, 2)) {
repetitor_start(&repetitor);
repetitor_measure_start(&repetitor);
testcase->cb(buffer, byte_count);
repetitor_measure_stop(&repetitor, byte_count);
repetitor_stop(&repetitor);
}
repetitor_print_results_label(&repetitor, testcase->name);
}
return 0;
}

View File

@ -53,6 +53,4 @@ int main_test_write_loop() {
}
return 0;
return 0;
}