Clean up x86_64 asm

This commit is contained in:
Natt Akuma 2024-02-02 04:33:20 +07:00
parent 17d8258d2e
commit 56b489c095

52
extern/ESFMu/esfm.c vendored
View file

@ -1754,7 +1754,7 @@ ESFM_process_feedback(esfm_chip *chip)
int32_t wave_out, wave_last; int32_t wave_out, wave_last;
int32_t phase_feedback; int32_t phase_feedback;
uint19 regressed_phase; uint19 regressed_phase;
int iter_counter; uint32_t iter_counter;
uint3 waveform; uint3 waveform;
uint3 mod_in_shift; uint3 mod_in_shift;
uint32_t phase, phase_acc; uint32_t phase, phase_acc;
@ -1781,30 +1781,30 @@ ESFM_process_feedback(esfm_chip *chip)
// ASM optimizaions! // ASM optimizaions!
#if defined(__GNUC__) && defined(__x86_64__) #if defined(__GNUC__) && defined(__x86_64__)
asm ( asm (
"movzbq %b[wave], %%r8 \n\t" "movzbq %[wave], %%r8 \n\t"
"shll $11, %%r8d \n\t" "shll $11, %%r8d \n\t"
"leaq %[sinrom], %%rax \n\t" "leaq %[sinrom], %%rax \n\t"
"addq %%rax, %%r8 \n\t" "addq %%rax, %%r8 \n\t"
"leaq %[exprom], %%r9 \n\t" "leaq %[exprom], %%r9 \n\t"
"movl %k[eg_out], %%r10d \n\t" "movzwl %[eg_out], %%r10d \n\t"
"shll $3, %%r10d \n\t" "shll $3, %%r10d \n\t"
"xorl %%r11d, %%r11d \n\t" "xorl %%r11d, %%r11d \n\t"
"movl %%r11d, %k[out] \n\t" "movl %%r11d, %[out] \n\t"
"movw $29, %%dx \n" "movl $29, %%edx \n"
"1: \n\t" "1: \n\t"
// phase_feedback = (wave_out + wave_last) >> 2; // phase_feedback = (wave_out + wave_last) >> 2;
"movl %k[out], %k[p_fb] \n\t" "movl %[out], %[p_fb] \n\t"
"addl %%r11d, %k[p_fb] \n\t" "addl %%r11d, %[p_fb] \n\t"
"sarl $2, %k[p_fb] \n\t" "sarl $2, %[p_fb] \n\t"
// wave_last = wave_out // wave_last = wave_out
"movl %k[out], %%r11d \n\t" "movl %[out], %%r11d \n\t"
// phase = phase_feedback >> mod_in_shift; // phase = phase_feedback >> mod_in_shift;
"movl %k[p_fb], %%ebx \n\t" "movl %[p_fb], %%eax \n\t"
"movb %b[mod_in], %%cl \n\t" "movb %[mod_in], %%cl \n\t"
"sarl %%cl, %%ebx \n\t" "sarl %%cl, %%eax \n\t"
// phase += phase_acc >> 9; // phase += phase_acc >> 9;
"movl %k[p_acc], %%eax \n\t" "movl %[p_acc], %%ebx \n\t"
"shrl $9, %%eax \n\t" "sarl $9, %%ebx \n\t"
"addl %%ebx, %%eax \n\t" "addl %%ebx, %%eax \n\t"
// lookup = logsinrom[(waveform << 10) | (phase & 0x3ff)]; // lookup = logsinrom[(waveform << 10) | (phase & 0x3ff)];
"andq $0x3ff, %%rax \n\t" "andq $0x3ff, %%rax \n\t"
@ -1820,26 +1820,26 @@ ESFM_process_feedback(esfm_chip *chip)
// wave_out = exprom[level & 0xff] >> (level >> 8); // wave_out = exprom[level & 0xff] >> (level >> 8);
"movb %%ah, %%cl \n\t" "movb %%ah, %%cl \n\t"
"movzbl %%al, %%eax \n\t" "movzbl %%al, %%eax \n\t"
"movzwl (%%r9, %%rax, 2), %k[out] \n\t" "movzwl (%%r9, %%rax, 2), %[out] \n\t"
"shrl %%cl, %k[out] \n\t" "shrl %%cl, %[out] \n\t"
// if (lookup & 0x8000) wave_out = -wave_out; // if (lookup & 0x8000) wave_out = -wave_out;
// in other words, lookup is negative // in other words, lookup is negative
"movl %k[out], %%ecx \n\t" "movl %[out], %%ecx \n\t"
"negl %%ecx \n\t" "negl %%ecx \n\t"
"testw %%bx, %%bx \n\t" "testw %%bx, %%bx \n\t"
"cmovsl %%ecx, %k[out] \n\t" "cmovsl %%ecx, %[out] \n\t"
// phase_acc += phase_offset // phase_acc += phase_offset
"addl %k[p_off], %k[p_acc] \n\t" "addl %[p_off], %[p_acc] \n\t"
// loop // loop
"decw %%dx \n\t" "decl %%edx \n\t"
"jne 1b \n\t" "jne 1b \n\t"
: [p_fb] "=&r" (phase_feedback), : [p_fb] "=&r" (phase_feedback),
[p_acc] "+r" (phase_acc), [p_acc] "+r" (phase_acc),
[out] "+r" (wave_out) [out] "=&r" (wave_out)
: [p_off] "g" ((uint32_t)phase_offset), : [p_off] "r" (phase_offset),
[mod_in] "g" ((uint8_t)mod_in_shift), [mod_in] "r" (mod_in_shift),
[wave] "g" ((uint8_t)waveform), [wave] "r" (waveform),
[eg_out] "g" ((uint32_t)eg_output), [eg_out] "r" (eg_output),
[sinrom] "m" (logsinrom), [sinrom] "m" (logsinrom),
[exprom] "m" (exprom) [exprom] "m" (exprom)
: "cc", "ax", "bx", "cx", "dx", "r8", "r9", "r10", "r11" : "cc", "ax", "bx", "cx", "dx", "r8", "r9", "r10", "r11"
@ -1847,7 +1847,7 @@ ESFM_process_feedback(esfm_chip *chip)
#else #else
wave_out = 0; wave_out = 0;
wave_last = 0; wave_last = 0;
for (iter_counter = 28; iter_counter >= 0; iter_counter--) for (iter_counter = 0; iter_counter < 29; iter_counter++)
{ {
phase_feedback = (wave_out + wave_last) >> 2; phase_feedback = (wave_out + wave_last) >> 2;
wave_last = wave_out; wave_last = wave_out;