2 * Copyright (C) 2024 Mikulas Patocka
4 * This file is part of Ajla.
6 * Ajla is free software: you can redistribute it and/or modify it under the
7 * terms of the GNU General Public License as published by the Free Software
8 * Foundation, either version 3 of the License, or (at your option) any later
11 * Ajla is distributed in the hope that it will be useful, but WITHOUT ANY
12 * WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR
13 * A PARTICULAR PURPOSE. See the GNU General Public License for more details.
15 * You should have received a copy of the GNU General Public License along with
16 * Ajla. If not, see <https://www.gnu.org/licenses/>.
19 #define OP_SIZE_NATIVE OP_SIZE_8
20 #define OP_SIZE_ADDRESS OP_SIZE_NATIVE
22 #define JMP_LIMIT JMP_SHORTEST
24 #define UNALIGNED_TRAP 1
26 #define ALU_WRITES_FLAGS(alu, im) 0
27 #define ALU1_WRITES_FLAGS(alu) 0
28 #define ROT_WRITES_FLAGS(alu, size, im) 0
29 #define COND_IS_LOGICAL(cond) 0
31 #define ARCH_PARTIAL_ALU(size) 0
32 #define ARCH_IS_3ADDRESS(alu, f) 1
33 #define ARCH_IS_3ADDRESS_IMM(alu, f) 1
34 #define ARCH_IS_3ADDRESS_ROT(alu, size) 1
35 #define ARCH_IS_3ADDRESS_ROT_IMM(alu) 1
36 #define ARCH_IS_2ADDRESS(alu) 1
37 #define ARCH_IS_3ADDRESS_FP 1
38 #define ARCH_HAS_JMP_2REGS(cond) 0
39 #define ARCH_HAS_FLAGS 0
40 #define ARCH_SUPPORTS_TRAPS OS_SUPPORTS_TRAPS
41 #define ARCH_TRAP_BEFORE 0
42 #define ARCH_PREFERS_SX(size) ((size) == OP_SIZE_4)
43 #define ARCH_HAS_BWX cpu_test_feature(CPU_FEATURE_bwx)
44 #define ARCH_HAS_MUL 1
45 #define ARCH_HAS_DIV 0
46 #define ARCH_HAS_ANDN 1
47 #define ARCH_HAS_SHIFTED_ADD(bits) ((bits) == 0 || (bits) == 2 || (bits) == 3)
48 #define ARCH_HAS_BTX(btx, size, cnst) 0
49 #define ARCH_SHIFT_SIZE OP_SIZE_8
50 #define ARCH_BOOL_SIZE OP_SIZE_8
51 #define ARCH_HAS_FP_GP_MOV cpu_test_feature(CPU_FEATURE_fix)
52 #define ARCH_NEEDS_BARRIER thread_needs_barriers
54 #define i_size(size) OP_SIZE_NATIVE
55 #define i_size_rot(size) OP_SIZE_NATIVE
56 #define i_size_cmp(size) OP_SIZE_NATIVE
58 /*#define TIMESTAMP_IN_REGISTER*/
127 #define R_UPCALL R_S1
128 #ifdef TIMESTAMP_IN_REGISTER
129 #define R_TIMESTAMP R_S2
132 #define R_SCRATCH_1 R_A0
133 #define R_SCRATCH_2 R_A1
134 #define R_SCRATCH_3 R_A2
135 #define R_SCRATCH_4 R_A3
136 #define R_SCRATCH_NA_1 R_T0
137 #define R_SCRATCH_NA_2 R_T1
138 #define R_SCRATCH_NA_3 R_T2
140 #define R_SAVED_1 R_S3
141 #define R_SAVED_2 R_S4
150 #define R_OFFSET_IMM R_T3
151 #define R_CONST_IMM R_T4
152 #define R_CMP_RESULT R_T5
154 #define FR_SCRATCH_1 R_F0
155 #define FR_SCRATCH_2 R_F1
156 #define FR_SCRATCH_3 R_F10
158 #define SUPPORTED_FP 0x6
160 #define FRAME_SIZE 0x50
162 static bool reg_is_fp(unsigned reg)
164 return reg >= 0x20 && reg < 0x40;
167 static const uint8_t regs_saved[] = {
168 #ifndef TIMESTAMP_IN_REGISTER
172 static const uint8_t regs_volatile[] = { R_T6, R_T7, R_A4, R_A5, R_T8, R_T9, R_T10, R_T11, R_RA, R_T12, R_AT, R_GP };
173 static const uint8_t fp_saved[] = { 0 };
174 #define n_fp_saved 0U
175 static const uint8_t fp_volatile[] = { R_F11, R_F12, R_F13, R_F14, R_F15, R_F16, R_F17, R_F18, R_F19, R_F20, R_F21, R_F22, R_F23, R_F24, R_F25, R_F26, R_F27, R_F28, R_F29, R_F30 };
176 #define reg_is_saved(r) (((r) >= R_S0 && (r) <= R_FP) || ((r) >= R_F2 && (r) <= R_F9))
178 static bool attr_w gen_load_constant(struct codegen_context *ctx, unsigned reg, uint64_t c)
181 int16_t c1, c2, c3, c4;
186 c2 = (int16_t)(c >> 16);
190 c3 = (int16_t)(c >> 32);
191 c &= ~0xffffffffffffUL;
193 c += 0x1000000000000UL;
194 c4 = (int16_t)(c >> 48);
196 gen_insn(INSN_ALU, OP_SIZE_NATIVE, ALU_ADD, 0);
200 gen_eight((uint64_t)c4 << 16);
204 gen_insn(INSN_ALU, OP_SIZE_NATIVE, ALU_ADD, 0);
212 gen_insn(INSN_ROT, OP_SIZE_NATIVE, ROT_SHL, 0);
219 gen_insn(INSN_ALU, OP_SIZE_NATIVE, ALU_ADD, 0);
223 gen_eight((uint64_t)c2 << 16);
226 if (c1 || r == R_ZERO) {
227 gen_insn(INSN_ALU, OP_SIZE_NATIVE, ALU_ADD, 0);
236 static bool attr_w gen_address(struct codegen_context *ctx, unsigned base, int64_t imm, unsigned purpose, unsigned size)
238 ctx->base_reg = base;
239 ctx->offset_imm = imm;
240 ctx->offset_reg = false;
242 case IMM_PURPOSE_LDR_OFFSET:
243 case IMM_PURPOSE_LDR_SX_OFFSET:
244 case IMM_PURPOSE_STR_OFFSET:
245 case IMM_PURPOSE_VLDR_VSTR_OFFSET:
246 case IMM_PURPOSE_MVI_CLI_OFFSET:
247 if (likely(imm >= -0x8000) && likely(imm < 0x8000))
251 internal(file_line, "gen_address: invalid purpose %u (imm %"PRIxMAX", size %u)", purpose, (uintmax_t)imm, size);
253 g(gen_load_constant(ctx, R_OFFSET_IMM, imm));
254 gen_insn(INSN_ALU, OP_SIZE_ADDRESS, ALU_ADD, 0);
255 gen_one(R_OFFSET_IMM);
256 gen_one(R_OFFSET_IMM);
258 ctx->base_reg = R_OFFSET_IMM;
263 static bool is_direct_const(int64_t imm, unsigned purpose, unsigned size)
265 int64_t imm_copy = imm;
267 case IMM_PURPOSE_STORE_VALUE:
271 case IMM_PURPOSE_SUB:
272 imm_copy = -(uint64_t)imm_copy;
274 case IMM_PURPOSE_ADD:
275 if (likely(imm_copy >= -0x8000) && likely(imm_copy < 0x8000))
277 if (imm_copy & 0xffff)
279 if (likely(imm_copy >= -0x80000000L) && likely(imm_copy < 0x80000000L))
282 case IMM_PURPOSE_CMP:
283 case IMM_PURPOSE_CMP_LOGICAL:
284 case IMM_PURPOSE_AND:
286 case IMM_PURPOSE_XOR:
287 case IMM_PURPOSE_ANDN:
288 case IMM_PURPOSE_TEST:
289 case IMM_PURPOSE_MUL:
290 case IMM_PURPOSE_MOVR:
291 case IMM_PURPOSE_ADD_TRAP:
292 case IMM_PURPOSE_SUB_TRAP:
293 if (imm >= 0 && imm < 256)
297 internal(file_line, "is_direct_const: invalid purpose %u (imm %"PRIxMAX", size %u)", purpose, (uintmax_t)imm, size);
302 static bool attr_w gen_imm(struct codegen_context *ctx, int64_t imm, unsigned purpose, unsigned size)
304 if (is_direct_const(imm, purpose, size)) {
305 ctx->const_imm = imm;
306 ctx->const_reg = false;
308 g(gen_load_constant(ctx, R_CONST_IMM, imm));
309 ctx->const_reg = true;
314 static bool attr_w gen_entry(struct codegen_context *ctx)
316 g(gen_imm(ctx, FRAME_SIZE, IMM_PURPOSE_SUB, OP_SIZE_NATIVE));
317 gen_insn(INSN_ALU, OP_SIZE_NATIVE, ALU_SUB, 0);
322 g(gen_address(ctx, R_SP, 0, IMM_PURPOSE_STR_OFFSET, OP_SIZE_NATIVE));
323 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
324 gen_address_offset();
327 #ifndef TIMESTAMP_IN_REGISTER
328 g(gen_address(ctx, R_SP, 8, IMM_PURPOSE_STR_OFFSET, OP_SIZE_4));
329 gen_insn(INSN_MOV, OP_SIZE_4, 0, 0);
330 gen_address_offset();
334 g(gen_address(ctx, R_SP, 16, IMM_PURPOSE_STR_OFFSET, OP_SIZE_NATIVE));
335 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
336 gen_address_offset();
339 g(gen_address(ctx, R_SP, 24, IMM_PURPOSE_STR_OFFSET, OP_SIZE_NATIVE));
340 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
341 gen_address_offset();
344 g(gen_address(ctx, R_SP, 32, IMM_PURPOSE_STR_OFFSET, OP_SIZE_NATIVE));
345 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
346 gen_address_offset();
349 g(gen_address(ctx, R_SP, 40, IMM_PURPOSE_STR_OFFSET, OP_SIZE_NATIVE));
350 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
351 gen_address_offset();
354 g(gen_address(ctx, R_SP, 48, IMM_PURPOSE_STR_OFFSET, OP_SIZE_NATIVE));
355 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
356 gen_address_offset();
359 g(gen_address(ctx, R_SP, 56, IMM_PURPOSE_STR_OFFSET, OP_SIZE_NATIVE));
360 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
361 gen_address_offset();
364 g(gen_address(ctx, R_SP, 64, IMM_PURPOSE_STR_OFFSET, OP_SIZE_NATIVE));
365 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
366 gen_address_offset();
369 g(gen_address(ctx, R_SP, 72, IMM_PURPOSE_STR_OFFSET, OP_SIZE_NATIVE));
370 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
371 gen_address_offset();
374 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
378 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
382 #ifdef TIMESTAMP_IN_REGISTER
383 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
384 gen_one(R_TIMESTAMP);
388 gen_insn(INSN_JMP_INDIRECT, 0, 0, 0);
394 static bool attr_w gen_escape_arg(struct codegen_context *ctx, ip_t ip, uint32_t escape_label)
396 g(gen_load_constant(ctx, R_SCRATCH_1, (int32_t)ip));
398 gen_insn(INSN_JMP, 0, 0, 0);
399 gen_four(escape_label);
404 static bool attr_w gen_escape(struct codegen_context *ctx)
406 g(gen_address(ctx, R_SP, 72, IMM_PURPOSE_LDR_OFFSET, OP_SIZE_NATIVE));
407 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
409 gen_address_offset();
411 g(gen_address(ctx, R_RET0, 0, IMM_PURPOSE_LDR_OFFSET, OP_SIZE_NATIVE));
412 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
413 gen_address_offset();
416 g(gen_address(ctx, R_RET0, 8, IMM_PURPOSE_LDR_OFFSET, OP_SIZE_4));
417 gen_insn(INSN_MOV, OP_SIZE_4, 0, 0);
418 gen_address_offset();
419 gen_one(R_SCRATCH_1);
421 g(gen_address(ctx, R_SP, 0, IMM_PURPOSE_LDR_OFFSET, OP_SIZE_NATIVE));
422 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
424 gen_address_offset();
426 g(gen_address(ctx, R_SP, 16, IMM_PURPOSE_LDR_OFFSET, OP_SIZE_NATIVE));
427 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
429 gen_address_offset();
431 g(gen_address(ctx, R_SP, 24, IMM_PURPOSE_LDR_OFFSET, OP_SIZE_NATIVE));
432 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
434 gen_address_offset();
436 g(gen_address(ctx, R_SP, 32, IMM_PURPOSE_LDR_OFFSET, OP_SIZE_NATIVE));
437 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
439 gen_address_offset();
441 g(gen_address(ctx, R_SP, 40, IMM_PURPOSE_LDR_OFFSET, OP_SIZE_NATIVE));
442 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
444 gen_address_offset();
446 g(gen_address(ctx, R_SP, 48, IMM_PURPOSE_LDR_OFFSET, OP_SIZE_NATIVE));
447 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
449 gen_address_offset();
451 g(gen_address(ctx, R_SP, 56, IMM_PURPOSE_LDR_OFFSET, OP_SIZE_NATIVE));
452 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
454 gen_address_offset();
456 g(gen_address(ctx, R_SP, 64, IMM_PURPOSE_LDR_OFFSET, OP_SIZE_NATIVE));
457 gen_insn(INSN_MOV, OP_SIZE_NATIVE, 0, 0);
459 gen_address_offset();
461 g(gen_imm(ctx, FRAME_SIZE, IMM_PURPOSE_ADD, OP_SIZE_NATIVE));
462 gen_insn(INSN_ALU, OP_SIZE_NATIVE, ALU_ADD, 0);
467 gen_insn(INSN_RET, 0, 0, 0);
472 static bool attr_w gen_upcall_argument(struct codegen_context attr_unused *ctx, unsigned attr_unused arg)
477 static bool attr_w gen_get_upcall_pointer(struct codegen_context *ctx, unsigned offset, unsigned reg)
479 g(gen_address(ctx, R_UPCALL, offset, IMM_PURPOSE_LDR_OFFSET, OP_SIZE_ADDRESS));
480 gen_insn(INSN_MOV, OP_SIZE_ADDRESS, 0, 0);
482 gen_address_offset();
487 static bool attr_w gen_upcall(struct codegen_context *ctx, unsigned offset, unsigned n_args)
489 g(gen_get_upcall_pointer(ctx, offset, R_T12));
491 gen_insn(INSN_CALL_INDIRECT, OP_SIZE_ADDRESS, 0, 0);
494 g(gen_upcall_end(ctx, n_args));
499 static bool attr_w gen_cmp_test_jmp(struct codegen_context *ctx, unsigned insn, unsigned op_size, unsigned reg1, unsigned reg2, unsigned cond, uint32_t label);
501 static bool attr_w gen_timestamp_test(struct codegen_context *ctx, uint32_t escape_label)
503 g(gen_address(ctx, R_UPCALL, offsetof(struct cg_upcall_vector_s, ts), IMM_PURPOSE_LDR_SX_OFFSET, OP_SIZE_4));
504 gen_insn(INSN_MOVSX, OP_SIZE_4, 0, 0);
505 gen_one(R_SCRATCH_1);
506 gen_address_offset();
508 #ifdef TIMESTAMP_IN_REGISTER
509 g(gen_cmp_test_jmp(ctx, INSN_CMP, OP_SIZE_NATIVE, R_SCRATCH_1, R_TIMESTAMP, COND_NE, escape_label));
511 g(gen_address(ctx, R_SP, 8, IMM_PURPOSE_LDR_OFFSET, OP_SIZE_4));
512 gen_insn(INSN_MOVSX, OP_SIZE_4, 0, 0);
513 gen_one(R_SCRATCH_2);
514 gen_address_offset();
516 g(gen_cmp_test_jmp(ctx, INSN_CMP, OP_SIZE_NATIVE, R_SCRATCH_1, R_SCRATCH_2, COND_NE, escape_label));