2 * Copyright (C) 2024 Mikulas Patocka
4 * This file is part of Ajla.
6 * Ajla is free software: you can redistribute it and/or modify it under the
7 * terms of the GNU General Public License as published by the Free Software
8 * Foundation, either version 3 of the License, or (at your option) any later
11 * Ajla is distributed in the hope that it will be useful, but WITHOUT ANY
12 * WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR
13 * A PARTICULAR PURPOSE. See the GNU General Public License for more details.
15 * You should have received a copy of the GNU General Public License along with
16 * Ajla. If not, see <https://www.gnu.org/licenses/>.
19 #define OP_SIZE_NATIVE OP_SIZE_8
20 #define OP_SIZE_ADDRESS OP_SIZE_8
22 #define JMP_LIMIT JMP_LONG
24 #define UNALIGNED_TRAP 0
26 #define ALU_WRITES_FLAGS(alu, im) 0
27 #define ALU1_WRITES_FLAGS(alu) 0
28 #define ROT_WRITES_FLAGS(alu, size, im) 0
29 #define COND_IS_LOGICAL(cond) 0
31 #define ARCH_PARTIAL_ALU(size) 0
32 #define ARCH_IS_3ADDRESS(alu, f) 1
33 #define ARCH_IS_3ADDRESS_IMM(alu, f) 1
34 #define ARCH_IS_3ADDRESS_ROT(alu, size) 1
35 #define ARCH_IS_3ADDRESS_ROT_IMM(alu) 1
36 #define ARCH_IS_2ADDRESS(alu) 1
37 #define ARCH_IS_3ADDRESS_FP 1
38 #define ARCH_HAS_JMP_2REGS(cond) 0
39 #define ARCH_HAS_FLAGS 1
40 #define ARCH_PREFERS_SX(size) 0
41 #define ARCH_HAS_BWX 1
42 #define ARCH_HAS_MUL 1
43 #define ARCH_HAS_DIV 1
44 #define ARCH_HAS_ANDN 1
45 #define ARCH_HAS_SHIFTED_ADD(bits) 1
46 #define ARCH_HAS_BTX(btx, size, cnst) 0
47 #define ARCH_SHIFT_SIZE OP_SIZE_4
48 #define ARCH_HAS_FP_GP_MOV 1
49 #define ARCH_NEEDS_BARRIER 0
51 #define i_size(size) maximum(size, OP_SIZE_4)
52 #define i_size_rot(size) maximum(size, OP_SIZE_4)
53 #define i_size_cmp(size) maximum(size, OP_SIZE_4)
121 #define FRAME_SIZE 0x60
124 #define R_UPCALL R_27
125 #define R_TIMESTAMP R_26
126 #define R_SAVED_1 R_25
127 #define R_SAVED_2 R_24
128 #define R_SAVED_3 R_23
129 #define R_SAVED_4 R_22
130 #define R_SAVED_5 R_21
131 #define R_SAVED_6 R_20
132 #define R_SAVED_7 R_19
134 #define R_SCRATCH_1 R_0
135 #define R_SCRATCH_2 R_1
136 #define R_SCRATCH_3 R_2
137 #define R_SCRATCH_4 R_3
138 #define R_SCRATCH_NA_1 R_8
139 #define R_SCRATCH_NA_2 R_9
140 #ifdef HAVE_BITWISE_FRAME
141 #define R_SCRATCH_NA_3 R_10
143 #define R_OFFSET_IMM R_16
144 #define R_CONST_IMM R_17
153 #define FR_SCRATCH_1 FR_0
154 #define FR_SCRATCH_2 FR_1
156 #define SUPPORTED_FP 0x6
157 #define SUPPORTED_FP_HALF_CVT 0x1
159 static bool reg_is_fp(unsigned reg)
161 return reg >= 0x20 && reg < 0x40;
164 static const uint8_t regs_saved[] = { R_SAVED_7, R_SAVED_6, R_SAVED_5, R_SAVED_4, R_SAVED_3 };
165 static const uint8_t regs_volatile[] = { R_4, R_5, R_6, R_7,
166 #ifndef HAVE_BITWISE_FRAME
169 R_11, R_12, R_13, R_14, R_15, R_LR };
170 static const uint8_t fp_saved[] = { 0 };
171 #define n_fp_saved 0U
172 static const uint8_t fp_volatile[] = { FR_2, FR_3, FR_4, FR_5, FR_6, FR_7, FR_16, FR_17, FR_18, FR_19, FR_20, FR_21, FR_22, FR_23, FR_24, FR_25, FR_26, FR_27, FR_28, FR_29, FR_30, FR_31 };
173 #define reg_is_saved(r) ((r) >= R_19 && (r) <= R_FP)
180 static const struct logical_imm value_to_code_4_table[] = {
181 #include "arm64-w.inc"
184 static const struct logical_imm value_to_code_8_table[] = {
185 #include "arm64-x.inc"
188 static int16_t value_to_code(uint8_t size, uint64_t value)
191 if (size == OP_SIZE_4) {
192 binary_search(size_t, n_array_elements(value_to_code_4_table), result, value_to_code_4_table[result].value == value, value_to_code_4_table[result].value < value, return -1);
193 return value_to_code_4_table[result].code;
195 binary_search(size_t, n_array_elements(value_to_code_8_table), result, value_to_code_8_table[result].value == value, value_to_code_8_table[result].value < value, return -1);
196 return value_to_code_8_table[result].code;
200 static bool attr_w gen_load_constant(struct codegen_context *ctx, unsigned reg, uint64_t c)
207 code = value_to_code(OP_SIZE_4, c);
209 gen_insn(INSN_ALU, OP_SIZE_4, ALU_OR, 0);
217 code = value_to_code(OP_SIZE_8, c);
219 gen_insn(INSN_ALU, OP_SIZE_8, ALU_OR, 0);
228 if ((int64_t)c < 0) {
229 gen_insn(INSN_MOV, OP_SIZE_8, 0, 0);
232 gen_eight((c & 0xffff) | 0xffffffffffff0000ULL);
233 if ((c & 0xffff0000ULL) != 0xffff0000ULL) {
234 gen_insn(INSN_MOV_MASK, OP_SIZE_8, MOV_MASK_16_32, 0);
238 gen_eight((c >> 16) & 0xffff);
240 if ((c & 0xffff00000000ULL) != 0xffff00000000ULL) {
241 gen_insn(INSN_MOV_MASK, OP_SIZE_8, MOV_MASK_32_48, 0);
245 gen_eight((c >> 32) & 0xffff);
247 if ((c & 0xffff000000000000ULL) != 0xffff000000000000ULL) {
248 gen_insn(INSN_MOV_MASK, OP_SIZE_8, MOV_MASK_48_64, 0);
252 gen_eight((c >> 48) & 0xffff);
255 gen_insn(INSN_MOV, OP_SIZE_8, 0, 0);
258 gen_eight(c & 0xffff);
259 if (c & 0xffff0000ULL) {
260 gen_insn(INSN_MOV_MASK, OP_SIZE_8, MOV_MASK_16_32, 0);
264 gen_eight((c >> 16) & 0xffff);
266 if (c & 0xffff00000000ULL) {
267 gen_insn(INSN_MOV_MASK, OP_SIZE_8, MOV_MASK_32_48, 0);
271 gen_eight((c >> 32) & 0xffff);
273 if (c & 0xffff000000000000ULL) {
274 gen_insn(INSN_MOV_MASK, OP_SIZE_8, MOV_MASK_48_64, 0);
278 gen_eight((c >> 48) & 0xffff);
284 static bool attr_w gen_address(struct codegen_context *ctx, unsigned base, int64_t imm, unsigned purpose, unsigned size)
286 ctx->base_reg = base;
287 ctx->offset_imm = imm;
288 ctx->offset_reg = false;
290 case IMM_PURPOSE_LDR_OFFSET:
291 case IMM_PURPOSE_LDR_SX_OFFSET:
292 case IMM_PURPOSE_STR_OFFSET:
293 case IMM_PURPOSE_VLDR_VSTR_OFFSET:
294 case IMM_PURPOSE_MVI_CLI_OFFSET:
295 if (likely(imm >= -256) && likely(imm <= 255))
297 if (likely(imm >= 0)) {
298 if (unlikely((imm & ((1 << size) - 1)) != 0))
300 if (likely((imm >> size) <= 4095))
304 case IMM_PURPOSE_LDP_STP_OFFSET:
305 if (unlikely((imm & ((1 << size) - 1)) != 0))
307 if (imm / (1 << size) >= -64 && imm / (1 << size) <= 63)
311 internal(file_line, "gen_address: invalid purpose %d", purpose);
313 g(gen_load_constant(ctx, R_OFFSET_IMM, imm));
314 if (purpose == IMM_PURPOSE_LDP_STP_OFFSET) {
315 gen_insn(INSN_ALU, OP_SIZE_ADDRESS, ALU_ADD, 0);
316 gen_one(R_OFFSET_IMM);
317 gen_one(R_OFFSET_IMM);
319 ctx->base_reg = R_OFFSET_IMM;
323 ctx->offset_reg = true;
328 static bool is_direct_const(int64_t imm, unsigned purpose, unsigned size)
331 case IMM_PURPOSE_STORE_VALUE:
335 case IMM_PURPOSE_ADD:
336 case IMM_PURPOSE_SUB:
337 case IMM_PURPOSE_CMP:
338 case IMM_PURPOSE_CMP_LOGICAL:
339 if (imm >= 0 && imm < 4096)
342 case IMM_PURPOSE_AND:
344 case IMM_PURPOSE_XOR:
345 case IMM_PURPOSE_ANDN:
346 case IMM_PURPOSE_TEST:
347 if (value_to_code(size, imm) >= 0)
350 case IMM_PURPOSE_MUL:
353 internal(file_line, "is_direct_const: invalid purpose %u (imm %"PRIxMAX", size %u)", purpose, (uintmax_t)imm, size);
358 static bool attr_w gen_imm(struct codegen_context *ctx, int64_t imm, unsigned purpose, unsigned size)
360 if (is_direct_const(imm, purpose, size)) {
361 ctx->const_imm = imm;
362 ctx->const_reg = false;
364 g(gen_load_constant(ctx, R_CONST_IMM, imm));
365 ctx->const_reg = true;
370 static bool attr_w gen_entry(struct codegen_context *ctx)
372 gen_insn(INSN_STP, OP_SIZE_8, 0, 0);
373 gen_one(ARG_ADDRESS_1_PRE_I);
375 gen_eight(-FRAME_SIZE);
379 gen_insn(INSN_MOV, OP_SIZE_8, 0, 0);
383 gen_insn(INSN_STP, OP_SIZE_8, 0, 0);
384 gen_one(ARG_ADDRESS_1);
390 gen_insn(INSN_STP, OP_SIZE_8, 0, 0);
391 gen_one(ARG_ADDRESS_1);
395 gen_one(R_TIMESTAMP);
397 gen_insn(INSN_STP, OP_SIZE_8, 0, 0);
398 gen_one(ARG_ADDRESS_1);
404 gen_insn(INSN_STP, OP_SIZE_8, 0, 0);
405 gen_one(ARG_ADDRESS_1);
411 gen_insn(INSN_STP, OP_SIZE_8, 0, 0);
412 gen_one(ARG_ADDRESS_1);
418 gen_insn(INSN_MOV, OP_SIZE_8, 0, 0);
422 gen_insn(INSN_MOV, OP_SIZE_8, 0, 0);
426 gen_insn(INSN_MOV, OP_SIZE_8, 0, 0);
427 gen_one(R_TIMESTAMP);
430 gen_insn(INSN_JMP_INDIRECT, 0, 0, 0);
436 static bool attr_w gen_escape_arg(struct codegen_context *ctx, ip_t ip, uint32_t escape_label)
438 g(gen_load_constant(ctx, R_RET1, ip));
440 gen_insn(INSN_JMP, 0, 0, 0);
441 gen_four(escape_label);
446 static bool attr_w gen_escape(struct codegen_context *ctx)
448 gen_insn(INSN_MOV, OP_SIZE_8, 0, 0);
452 gen_insn(INSN_LDP, OP_SIZE_8, 0, 0);
455 gen_one(ARG_ADDRESS_1);
459 gen_insn(INSN_LDP, OP_SIZE_8, 0, 0);
462 gen_one(ARG_ADDRESS_1);
466 gen_insn(INSN_LDP, OP_SIZE_8, 0, 0);
469 gen_one(ARG_ADDRESS_1);
473 gen_insn(INSN_LDP, OP_SIZE_8, 0, 0);
475 gen_one(R_TIMESTAMP);
476 gen_one(ARG_ADDRESS_1);
480 gen_insn(INSN_LDP, OP_SIZE_8, 0, 0);
483 gen_one(ARG_ADDRESS_1);
487 gen_insn(INSN_LDP, OP_SIZE_8, 0, 0);
490 gen_one(ARG_ADDRESS_1_POST_I);
492 gen_eight(FRAME_SIZE);
494 gen_insn(INSN_RET, 0, 0, 0);
499 static bool attr_w gen_upcall_argument(struct codegen_context attr_unused *ctx, unsigned attr_unused arg)
504 static bool attr_w gen_upcall(struct codegen_context *ctx, unsigned offset, unsigned n_args)
506 g(gen_address(ctx, R_UPCALL, offset, IMM_PURPOSE_LDR_OFFSET, OP_SIZE_8));
507 gen_insn(INSN_MOV, OP_SIZE_8, 0, 0);
508 gen_one(R_SCRATCH_NA_1);
509 gen_address_offset();
511 gen_insn(INSN_CALL_INDIRECT, OP_SIZE_8, 0, 0);
512 gen_one(R_SCRATCH_NA_1);
514 g(gen_upcall_end(ctx, n_args));
519 static bool attr_w gen_timestamp_test(struct codegen_context *ctx, uint32_t escape_label)
521 g(gen_address(ctx, R_UPCALL, offsetof(struct cg_upcall_vector_s, ts), IMM_PURPOSE_LDR_OFFSET, OP_SIZE_4));
522 gen_insn(INSN_MOV, OP_SIZE_4, 0, 0);
523 gen_one(R_SCRATCH_1);
524 gen_address_offset();
526 gen_insn(INSN_CMP, OP_SIZE_4, 0, 1);
527 gen_one(R_SCRATCH_1);
528 gen_one(R_TIMESTAMP);
530 gen_insn(INSN_JMP_COND, OP_SIZE_4, COND_NE, 0);
531 gen_four(escape_label);