Files
2026-05-10 01:49:00 +02:00

110 lines
3.4 KiB
ArmAsm

// SPDX-License-Identifier: Apache-2.0
// SPDX-FileCopyrightText: 2026 The Ebitengine Authors
//go:build linux
#include "textflag.h"
#include "go_asm.h"
#include "funcdata.h"
// S390X ELF ABI callbackasm1 implementation
// On entry, R0 contains the callback index (set by callbackasm)
// NOTE: We use R0 instead of R11 because R11 is callee-saved on S390X.
//
// S390X stack frame layout:
// 0(R15) - back chain
// 48(R15) - register save area (R6-R15)
// 160(R15) - parameter area
//
// S390X uses R2-R6 for integer arguments (5 registers) and F0,F2,F4,F6 for floats (4 registers).
//
// Our frame layout (total 264 bytes, 8-byte aligned):
// 0(R15) - back chain
// 48(R15) - saved R6-R15 (done by STMG)
// 160(R15) - callbackArgs struct (32 bytes: index, args, result, stackArgs)
// 192(R15) - args array start
//
// Args array layout:
// - floats F0,F2,F4,F6 (32 bytes)
// - ints R2-R6 (40 bytes)
// Total args array: 72 bytes, ends at 264
//
// Stack args in caller's frame start at old_R15+160
#define FRAME_SIZE 264
#define CB_ARGS 160
#define ARGS_ARRAY 192
#define FLOAT_OFF 0
#define INT_OFF 32
TEXT callbackasm1(SB), NOSPLIT|NOFRAME, $0
NO_LOCAL_POINTERS
// On entry, the trampoline in zcallback_s390x.s left
// the callback index in R0 (NOT R11, since R11 is callee-saved).
// R6 contains the 5th integer argument.
// Save R6-R15 in caller's frame (per S390X ABI) BEFORE allocating our frame
// STMG stores R6's current value (the 5th arg) at 48(R15)
STMG R6, R15, 48(R15)
// Save current stack pointer (will be back chain)
MOVD R15, R1
// Allocate our stack frame
SUB $FRAME_SIZE, R15
MOVD R1, 0(R15) // back chain
// Save R0 (callback index) immediately - it's volatile
MOVD R0, (CB_ARGS+0)(R15)
// Save callback arguments to args array.
// Layout: floats first (F0,F2,F4,F6), then ints (R2-R6)
FMOVD F0, (ARGS_ARRAY+FLOAT_OFF+0*8)(R15)
FMOVD F2, (ARGS_ARRAY+FLOAT_OFF+1*8)(R15)
FMOVD F4, (ARGS_ARRAY+FLOAT_OFF+2*8)(R15)
FMOVD F6, (ARGS_ARRAY+FLOAT_OFF+3*8)(R15)
MOVD R2, (ARGS_ARRAY+INT_OFF+0*8)(R15)
MOVD R3, (ARGS_ARRAY+INT_OFF+1*8)(R15)
MOVD R4, (ARGS_ARRAY+INT_OFF+2*8)(R15)
MOVD R5, (ARGS_ARRAY+INT_OFF+3*8)(R15)
// R6 (5th int arg) was saved at 48(old_R15) by STMG
// old_R15 = current R15 + FRAME_SIZE, so R6 is at 48+FRAME_SIZE(R15) = 312(R15)
MOVD (48+FRAME_SIZE)(R15), R1
MOVD R1, (ARGS_ARRAY+INT_OFF+4*8)(R15)
// Finish setting up callbackArgs struct at CB_ARGS(R15)
// struct { index uintptr; args unsafe.Pointer; result uintptr; stackArgs unsafe.Pointer }
// Note: index was already saved earlier
ADD $ARGS_ARRAY, R15, R1
MOVD R1, (CB_ARGS+8)(R15) // args = address of register args
MOVD $0, (CB_ARGS+16)(R15) // result = 0
// stackArgs points to caller's stack arguments at old_R15+160 = R15+FRAME_SIZE+160
ADD $(FRAME_SIZE+160), R15, R1
MOVD R1, (CB_ARGS+24)(R15) // stackArgs = &caller_stack_args
// Call crosscall2 with arguments in registers:
// R2 = fn (from callbackWrap_call closure)
// R3 = frame (address of callbackArgs)
// R5 = ctxt (0)
MOVD ·callbackWrap_call(SB), R2
MOVD (R2), R2 // dereference closure to get fn
ADD $CB_ARGS, R15, R3 // frame = &callbackArgs
MOVD $0, R5 // ctxt = 0
BL crosscall2(SB)
// Get callback result into R2
MOVD (CB_ARGS+16)(R15), R2
// Deallocate frame
ADD $FRAME_SIZE, R15
// Restore R6-R15 from caller's frame
LMG 48(R15), R6, R15
RET