mirror of
https://github.com/ProgramSnail/Lama.git
synced 2025-12-05 22:38:44 +00:00
1532 lines
53 KiB
OCaml
1532 lines
53 KiB
OCaml
open GT
|
|
open Language
|
|
open SM
|
|
open Options
|
|
|
|
(* X86 codegeneration interface *)
|
|
|
|
(** Code generation settings shared by the whole backend. *)
type compilation_mode_t = {
  is_debug : bool;
      (** When set, the compiler annotates the output with the symbolic stack
          state of every stack machine instruction. *)
  target_os : os_t;
      (** Target operating system; stabs debug directives are only emitted
          for Linux. *)
}
|
|
|
|
(** A hardware register together with the names of its 8-bit and 64-bit
    views. A value of type [t] always has one of the two views selected;
    [show] prints the selected one. *)
module Register : sig
  type t

  val from_names : l8:string -> l64:string -> t
  (** Register with explicit 8-bit and 64-bit names; the 64-bit view is
      selected. *)

  val from_number : int -> t
  (** Numbered register [%rN] (8-bit name [%rNb]); the 64-bit view is
      selected. *)

  val of_8bit : t -> t
  (** Same register with the 8-bit view selected. *)

  val of_64bit : t -> t
  (** Same register with the 64-bit view selected. *)

  val show : t -> string
  (** Name of the currently selected view. *)
end = struct
  (* Only the 8-bit and 64-bit names are kept: other sizes are not used. *)
  type register_desc = { name8 : string; name64 : string }

  (* Currently selected name paired with the full description. *)
  type t = string * register_desc

  let from_names ~l8 ~l64 = (l64, { name8 = l8; name64 = l64 })

  let from_number n =
    from_names ~l8:(Printf.sprintf "%%r%db" n) ~l64:(Printf.sprintf "%%r%d" n)

  (* Re-select the visible name of a register using [pick]. *)
  let select pick ((_, desc) : t) : t = (pick desc, desc)
  let of_8bit reg = select (fun desc -> desc.name8) reg
  let of_64bit reg = select (fun desc -> desc.name64) reg
  let show (selected, _) = selected
end
|
|
|
|
(** The x86-64 general purpose registers used by the code generator. *)
module Registers : sig
  val rax : Register.t
  val rdi : Register.t
  val rsi : Register.t
  val rdx : Register.t
  val rcx : Register.t
  val rbp : Register.t
  val rsp : Register.t
  val r8 : Register.t
  val r9 : Register.t
  val r10 : Register.t
  val r11 : Register.t
  val r12 : Register.t
  val r13 : Register.t
  val r14 : Register.t
  val r15 : Register.t

  val argument_registers : Register.t array
  (** All of the argument registers are caller-saved *)

  val extra_caller_saved_registers : Register.t array
  (** Caller-saved registers that are not used for arguments *)
end = struct
  (* Short local constructors; they are hidden by the signature. *)
  let named l8 l64 = Register.from_names ~l8 ~l64
  let numbered = Register.from_number

  (* Caller-saved special register *)
  let rax = named "%al" "%rax"

  (* Caller-saved special and argument register *)
  let rdx = named "%dl" "%rdx"

  (* Caller-saved argument registers *)
  let rdi = named "%dil" "%rdi"
  let rsi = named "%sil" "%rsi"
  let rcx = named "%cl" "%rcx"
  let r8 = numbered 8
  let r9 = numbered 9

  (* Extra caller-saved registers *)
  let r10 = numbered 10
  let r11 = numbered 11

  (* Callee-saved special registers *)
  let rbp = named "%bpl" "%rbp"
  let rsp = named "%spl" "%rsp"

  (* The r12-r15 registers are callee-saved in x86-64, but we use them as
     caller-saved for simplicity. This disallows calling Lama code from C,
     while it does not affect C calls made from Lama. *)
  let r12 = numbered 12
  let r13 = numbered 13
  let r14 = numbered 14
  let r15 = numbered 15

  (* Listed in argument order: first argument in rdi, second in rsi, ... *)
  let argument_registers = [| rdi; rsi; rdx; rcx; r8; r9 |]

  (* r15 is not listed here. *)
  let extra_caller_saved_registers = [| r10; r11; r12; r13; r14 |]
end
|
|
|
|
(* Attributes of the named memory location addressing *)

(* External symbols have to be accessed through PLT or GOTPCREL,
   while internal ones just use rip-based addressing. *)
type externality =
  | I  (** Internal *)
  | E  (** External *)

(* External functions have to be accessed through PLT,
   while external data is accessed through GOTPCREL. *)
type data_kind =
  | F  (** Function *)
  | D  (** Data *)

(* For functions and strings their value is their address,
   while for numbers it is the value stored at this address. *)
type addressed =
  | A  (** Address *)
  | V  (** Value *)
|
|
|
|
(* The operand kinds the code generator distinguishes. *)
type opnd =
  | R of Register.t  (** Hard register *)
  | S of int  (** Position on the hardware stack *)
  | M of data_kind * externality * addressed * string
      (** Named memory location *)
  | C of string  (** Named constant *)
  | L of int  (** Immediate operand *)
  | I of int * opnd  (** Indirect operand with offset *)

(* Where a call argument is passed: in the given register operand or on the
   hardware stack. *)
type argument_location = Register of opnd | Stack
|
|
|
|
(* Size of a machine word in bytes; needed to calculate stack offsets and
   stack adjustments correctly. *)
let word_size : int = 8
|
|
|
|
(** Extracts the hardware register from an [R] operand.
    @raise Failure if the operand is of any other kind. *)
let as_register = function
  | R reg -> reg
  | S _ | M _ | C _ | L _ | I _ -> failwith "as_register: not a register"
|
|
|
|
(** Debug rendering of an operand: the constructor name followed by its
    arguments, separated by spaces. This is not assembly syntax. *)
let rec show_opnd operand =
  match operand with
  | R reg -> "R " ^ Register.show reg
  | S slot -> "S " ^ string_of_int slot
  | L imm -> "L " ^ string_of_int imm
  | I (offset, base) -> Printf.sprintf "I %d %s" offset (show_opnd base)
  | C name -> "C " ^ name
  | M (kind, ext, addr, name) ->
      let kind_name = match kind with F -> "Function" | D -> "Data" in
      let ext_name = match ext with I -> "Internal" | E -> "External" in
      let addr_name = match addr with A -> "Address" | V -> "Value" in
      String.concat " " [ "M"; kind_name; ext_name; addr_name; name ]
|
|
|
|
(* Operand-level synonyms for the registers, so that instruction lists can
   mention them directly. *)
let rax = R Registers.rax
and rdx = R Registers.rdx
and rbp = R Registers.rbp
and rsp = R Registers.rsp
and rdi = R Registers.rdi
and rsi = R Registers.rsi
and rcx = R Registers.rcx
and r8 = R Registers.r8
and r9 = R Registers.r9
and r10 = R Registers.r10
and r11 = R Registers.r11
and r12 = R Registers.r12
and r13 = R Registers.r13
and r14 = R Registers.r14
and r15 = R Registers.r15
|
|
|
|
(* Value used to fill otherwise unused stack locations.
   Garbage is not allowed there because it would affect the GC. *)
let filler : opnd = M (D, I, V, "filler")
|
|
|
|
(* The subset of x86 instructions the code generator emits. *)
type instr =
  | Mov of opnd * opnd
      (** copies a value from the first to the second operand *)
  | Lea of opnd * opnd
      (** loads an address of the first operand into the second *)
  | Binop of string * opnd * opnd
      (** makes a binary operation; note, the first operand designates
          x86 operator, not the source language one *)
  | IDiv of opnd  (** x86 integer division, see instruction set reference *)
  | Cltd  (** see instruction set reference; printed as [cqo] *)
  | Set of string * Register.t
      (** sets a value from flags; the first operand is the suffix, which
          determines the value being set, the second --- (sub)register
          name *)
  | Push of opnd  (** pushes the operand on the hardware stack *)
  | Pop of opnd  (** pops from the hardware stack to the operand *)
  | Call of string  (** call a function by a name *)
  | CallI of opnd  (** call a function by indirect address *)
  | Ret  (** returns from a function *)
  | Label of string  (** a label in the code *)
  | CJmp of string * string
      (** a conditional jump: condition suffix and target label *)
  | Jmp of string  (** a non-conditional jump by a name *)
  | JmpI of opnd  (** a non-conditional jump by indirect address *)
  | Meta of string  (** directive, printed verbatim *)
  | Dec of opnd  (** arithmetic correction: decrement *)
  | Or1 of opnd  (** arithmetic correction: or 0x0001 *)
  | Sal1 of opnd  (** arithmetic correction: shift left by 1 *)
  | Sar1 of opnd
      (** arithmetic correction: shift right by 1 (printed as [sarq]) *)
  | Repmovsl  (** repeated string move; printed as [rep movsq] *)
|
|
|
|
(** Magnitude, in bytes, of the rbp-relative displacement of stack position
    [i]: [(|i| + 1) * word_size]. The sign is chosen by the caller. *)
let stack_offset i = (abs i + 1) * word_size
|
|
|
|
(* Instruction printer: renders one instruction as assembly text.
   [env#prefixed] is applied to every symbol name (labels, call and jump
   targets, named memory locations and named constants). *)
let show env instr =
  let rec opnd = function
    | R reg -> Register.show reg
    | S slot ->
        (* Non-negative positions get a leading minus, negative ones do
           not; the magnitude comes from [stack_offset]. *)
        let sign = if slot >= 0 then "-" else "" in
        Printf.sprintf "%s%d(%%rbp)" sign (stack_offset slot)
    | M (_, I, _, name) | M (F, E, _, name) ->
        Printf.sprintf "%s(%%rip)" (env#prefixed name)
    | M (D, E, _, name) ->
        Printf.sprintf "%s@GOTPCREL(%%rip)" (env#prefixed name)
    | C name -> "$" ^ env#prefixed name
    | L imm -> Printf.sprintf "$%d" imm
    | I (0, base) -> Printf.sprintf "(%s)" (opnd base)
    | I (offset, base) -> Printf.sprintf "%d(%s)" offset (opnd base)
  in
  (* Maps the operator tag carried by [Binop] to the x86 mnemonic. *)
  let mnemonic = function
    | "+" -> "addq"
    | "-" -> "subq"
    | "*" -> "imulq"
    | "&&" -> "andq"
    | "!!" -> "orq"
    | "^" -> "xorq"
    | "cmp" -> "cmpq"
    | "test" -> "test"
    | _ -> failwith "unknown binary operator"
  in
  let unary name a = Printf.sprintf "\t%s\t%s" name (opnd a) in
  let binary name a b =
    Printf.sprintf "\t%s\t%s,\t%s" name (opnd a) (opnd b)
  in
  match instr with
  | Cltd -> "\tcqo"
  | Set (suf, reg) ->
      (* set<cc> always targets the 8-bit view of the register *)
      Printf.sprintf "\tset%s\t%s" suf (Register.show (Register.of_8bit reg))
  | IDiv divisor -> unary "idivq" divisor
  | Binop (op, src, dst) -> binary (mnemonic op) src dst
  (* Moving an address-valued named location is printed as leaq *)
  | Mov ((M (_, _, A, _) as src), dst) | Lea (src, dst) ->
      binary "leaq" src dst
  | Mov (src, dst) -> binary "movq" src dst
  | Push a -> unary "pushq" a
  | Pop a -> unary "popq" a
  | Ret -> "\tret"
  | Call target -> "\tcall\t" ^ env#prefixed target
  | CallI target -> Printf.sprintf "\tcall\t*(%s)" (opnd target)
  | Label name -> env#prefixed name ^ ":\n"
  | Jmp target -> "\tjmp\t" ^ env#prefixed target
  | JmpI target -> Printf.sprintf "\tjmp\t*(%s)" (opnd target)
  | CJmp (cond, target) ->
      Printf.sprintf "\tj%s\t%s" cond (env#prefixed target)
  | Meta text -> text ^ "\n"
  | Dec a -> unary "decq" a
  | Or1 a -> Printf.sprintf "\torq\t$0x0001,\t%s" (opnd a)
  | Sal1 a -> unary "salq" a
  | Sar1 a -> unary "sarq" a
  | Repmovsl -> "\trep movsq\t"
|
|
|
|
(* Most instructions have constraints on memory operands, so we need to
   know whether an operand refers to memory (named location, stack slot or
   indirect access) or not (constant, register or immediate). *)
let in_memory operand =
  match operand with
  | M _ -> true
  | S _ -> true
  | I _ -> true
  | C _ -> false
  | R _ -> false
  | L _ -> false
|
|
|
|
(** [mov x s] returns the instructions that copy operand [x] into [s]:

    - nothing when source and destination are the same operand;
    - a two-step move through [rax] when a direct move cannot be encoded,
      i.e. memory-to-memory, or an immediate that does not fit into a
      sign-extended 32-bit field being stored to memory;
    - a single [Mov] otherwise.

    The two-step form clobbers [rax]. *)
let mov x s =
  (* A store of an immediate to memory only carries a 32-bit immediate that
     is sign-extended to 64 bits, so the representable range is
     [-2^31, 2^31 - 1]. Anything outside must go through a register. *)
  let fits_imm32 n = n >= -0x80000000 && n <= 0x7FFFFFFF in
  let wide_literal = function L n -> not (fits_imm32 n) | _ -> false in
  if x = s then []
  else if (in_memory x && in_memory s) || (wide_literal x && in_memory s)
  then [ Mov (x, rax); Mov (rax, s) ]
  else [ Mov (x, s) ]
|
|
|
|
(* Boxing for numeric values: shift left by one bit and set the lowest bit.
   After the shift the lowest bit is zero, so adding one sets it. *)
let box n = (n lsl 1) + 1
|
|
|
|
(*
   Compile binary operation

   compile_binop : env -> string -> env * instr list

   The two topmost symbolic stack entries are the operands: [x] is the top
   one and [y] the one below it. The result is written back into [y] and
   [x] is popped. Both operands and the result are boxed values.
*)
let compile_binop env op =
  (* Condition-code suffix for a comparison operator *)
  let suffix = function
    | "<" -> "l"
    | "<=" -> "le"
    | "==" -> "e"
    | "!=" -> "ne"
    | ">=" -> "ge"
    | ">" -> "g"
    | _ -> failwith "unknown operator"
  in
  let x, y = env#peek2 in
  (* Box the value held in rax and store it into [dst] *)
  let store_boxed_rax dst = [ Sal1 rax; Or1 rax; Mov (rax, dst) ] in
  (* For binary operations requiring no extra register *)
  let without_extra gen =
    let _x, env = env#pop in
    (env, gen ())
  in
  (* For binary operations requiring rdx: when rdx is already in use its
     value is parked in a freshly allocated location around the code *)
  let with_rdx gen =
    if env#rdx_in_use then
      let extra, env = env#allocate in
      let _extra, env = env#pop in
      let _x, env = env#pop in
      let code = gen rdx in
      (env, (Mov (rdx, extra) :: code) @ [ Mov (extra, rdx) ])
    else
      let _x, env = env#pop in
      (env, gen rdx)
  in
  (* For binary operations requiring any extra register: if the allocated
     location turns out to be in memory, rdx is borrowed instead and its
     value is saved in that location meanwhile *)
  let with_extra gen =
    let extra, env = env#allocate in
    let _extra, env = env#pop in
    let _x, env = env#pop in
    if in_memory extra then
      (env, (Mov (rdx, extra) :: gen rdx) @ [ Mov (extra, rdx) ])
    else (env, gen extra)
  in
  match op with
  | "/" ->
      with_rdx (fun d ->
          [
            Mov (y, rax);
            Sar1 rax;
            Binop ("^", d, d);
            Cltd;
            Sar1 x;
            IDiv x;
          ]
          @ store_boxed_rax y)
  | "%" ->
      (* The remainder is left in rdx by the division *)
      with_rdx (fun d ->
          [
            Mov (y, rax);
            Sar1 rax;
            Cltd;
            Sar1 x;
            IDiv x;
            Sal1 d;
            Or1 d;
            Mov (d, y);
          ])
  | "<" | "<=" | "==" | "!=" | ">=" | ">" ->
      (* Compare [lhs] with [y], materialize the flag in rax, box it *)
      let compare_and_store lhs =
        [ Binop ("cmp", lhs, y); Set (suffix op, Registers.rax) ]
        @ store_boxed_rax y
      in
      if in_memory x then
        (* [x] is first loaded into a register *)
        with_extra (fun extra ->
            Binop ("^", rax, rax) :: Mov (x, extra) :: compare_and_store extra)
      else
        without_extra (fun () -> Binop ("^", rax, rax) :: compare_and_store x)
  | "*" ->
      without_extra (fun () ->
          if in_memory y then
            [
              Dec y;
              Mov (x, rax);
              Sar1 rax;
              Binop (op, y, rax);
              Or1 rax;
              Mov (rax, y);
            ]
          else [ Dec y; Mov (x, rax); Sar1 rax; Binop (op, rax, y); Or1 y ])
  | "&&" ->
      with_extra (fun extra ->
          [
            Dec x;
            Mov (x, rax);
            Binop (op, x, rax);
            Mov (L 0, rax);
            Set ("ne", Registers.rax);
            Dec y;
            Mov (y, extra);
            Binop (op, y, extra);
            Mov (L 0, extra);
            Set ("ne", as_register extra);
            Binop (op, extra, rax);
            Set ("ne", Registers.rax);
          ]
          @ store_boxed_rax y)
  | "!!" ->
      without_extra (fun () ->
          [
            Mov (y, rax);
            Sar1 rax;
            Sar1 x;
            Binop (op, x, rax);
            Mov (L 0, rax);
            Set ("ne", Registers.rax);
          ]
          @ store_boxed_rax y)
  | "+" ->
      without_extra (fun () ->
          if in_memory x && in_memory y then
            [ Mov (x, rax); Dec rax; Binop ("+", rax, y) ]
          else [ Binop (op, x, y); Dec y ])
  | "-" ->
      without_extra (fun () ->
          if in_memory x && in_memory y then
            [ Mov (x, rax); Binop (op, rax, y); Or1 y ]
          else [ Binop (op, x, y); Or1 y ])
  | _ ->
      failwith (Printf.sprintf "Unexpected pattern: %s: %d" __FILE__ __LINE__)
|
|
|
|
(* For pointers to be marked by the GC as alive they have to be located on
   the stack. As we do not control where the C compiler places them at the
   moment of GC, we have to put them on the stack explicitly and pass the
   runtime function a reference to their location.

   Not listed, as they do not have pointer arguments:
   "makeArray", "makeString", "getEnv", "set_args".
   Lsprintf, or Bsprintf, is an extra dirty hack that probably works. *)
let safepoint_functions =
  List.map labeled [ "s__Infix_58"; "substring"; "clone" ]
  @ [ labeled_builtin "string" ]
  @ List.map labeled [ "stringcat"; "string" ]
  @ List.map labeled_builtin [ "closure"; "array"; "sexp" ]
  @ [ labeled "i__Infix_4343" ]
|
|
|
|
(* For vararg functions, which pass their arguments on to the stdlib
   function using va_list, we have to unbox values to print them correctly.
   For this we have special assembly functions in `printf.S`.
   We additionally pass them the amount of arguments to unbox in register
   r11.

   Each entry pairs a function label with the number of its leading
   arguments that are not counted as varargs. *)
let vararg_functions =
  List.map
    (fun (name, fixed_args) -> (labeled name, fixed_args))
    [ ("printf", 1); ("fprintf", 2); ("sprintf", 1); ("failure", 1) ]
|
|
|
|
(** [compile_call env ?fname nargs tail] compiles a call that takes its
    [nargs] arguments from the top of the symbolic stack.

    - [fname]: the callee's name; a leading ['.'] marks a builtin and is
      replaced via [labeled_builtin]. When absent, the call goes through a
      closure that is popped from the symbolic stack after the arguments.
    - [tail]: whether the call is in tail position.

    Returns the updated environment and the generated instructions. One of
    three strategies is chosen: a safepoint call (arguments are pushed on
    the hardware stack and a pointer to them is passed in rdi), a tail
    call (arguments overwrite the current ones and the callee is jumped
    to), or a common call. *)
let compile_call env ?fname nargs tail =
  let fname =
    Option.map
      (fun fname ->
        match fname.[0] with
        | '.' -> labeled_builtin (String.sub fname 1 (String.length fname - 1))
        | _ -> fname)
      fname
  in
  let safepoint_call =
    match fname with
    | Some fname -> List.mem fname safepoint_functions
    | None -> false
  in
  let tail_call_optimization_applicable =
    let allowed_function =
      match fname with
      | Some fname ->
          let is_vararg =
            Option.is_some (List.assoc_opt fname vararg_functions)
          in
          let is_internal = fname.[0] = 'B' in
          (not is_internal) && not is_vararg
      | None -> true
    in
    (* The arguments are written over the current function's own ones, so
       the counts have to match *)
    let same_arguments_count = env#nargs = nargs in
    tail && allowed_function && same_arguments_count
  in

  (* ---- Helpers shared by the common and the safepoint call ---- *)

  (* Pops [n] operands; the returned list is in argument order *)
  let rec pop_arguments env acc = function
    | 0 -> (env, acc)
    | n ->
        let x, env = env#pop in
        pop_arguments env (x :: acc) (n - 1)
  in
  (* Push/pop pairs for every live register, plus r15 when the current
     function has a closure. The pops are returned in push order and have
     to be reversed by the caller. *)
  let protect_registers env =
    let pushr, popr =
      List.split (List.map (fun r -> (Push r, Pop r)) env#live_registers)
    in
    if env#has_closure then (Push r15 :: pushr, Pop r15 :: popr)
    else (pushr, popr)
  in
  (* Keeps the number of words pushed before the call even by adding a
     filler word when needed; the epilogue drops the stack arguments
     together with the filler. *)
  let align_stack saved_registers stack_arguments =
    let aligned = (saved_registers + stack_arguments) mod 2 = 0 in
    if aligned && stack_arguments = 0 then ([], [])
    else if aligned then
      ([], [ Binop ("+", L (word_size * stack_arguments), rsp) ])
    else
      ( [ Push filler ],
        [ Binop ("+", L (word_size * (1 + stack_arguments)), rsp) ] )
  in
  (* Allocates a symbolic stack location and stores the call result in it *)
  let move_result env =
    let y, env = env#allocate in
    (env, [ Mov (rax, y) ])
  in

  let compile_tail_call env fname nargs =
    (* Moves the new arguments into the locations of the current ones *)
    let rec push_args env acc = function
      | 0 -> (env, acc)
      | n ->
          let x, env = env#pop in
          push_args env (mov x (env#loc (Value.Arg (n - 1))) @ acc) (n - 1)
    in
    let env, pushs = push_args env [] nargs in
    let env, setup_closure =
      match fname with
      | Some _ -> (env, [])
      | None ->
          let closure, env = env#pop in
          (env, [ Mov (closure, r15) ])
    in
    let add_argc_counter = [ Mov (L nargs, r11) ] in
    let jump =
      match fname with Some fname -> [ Jmp fname ] | None -> [ JmpI r15 ]
    in
    (* The symbolic stack still receives a slot for the call's result *)
    let _, env = env#allocate in
    ( env,
      pushs
      @ [ Mov (rbp, rsp); Pop rbp ]
      @ setup_closure @ add_argc_counter @ jump )
  in

  let compile_common_call env fname nargs =
    let setup_arguments env nargs =
      (* The accumulator reverses the order, so the last argument is moved
         or pushed first *)
      let move_arguments args arg_locs =
        List.fold_left2
          (fun acc arg arg_loc ->
            match arg_loc with
            | Register r -> Mov (arg, r) :: acc
            | Stack -> Push arg :: acc)
          [] args arg_locs
      in
      let env, args = pop_arguments env [] nargs in
      let arg_locs, stack_slots =
        env#arguments_locations (List.length args)
      in
      (stack_slots, env, move_arguments args arg_locs)
    in
    let setup_closure env =
      match fname with
      | Some _ -> (env, [])
      | None ->
          let closure, env = env#pop in
          (env, [ Mov (closure, r15) ])
    in
    let call =
      match fname with Some fname -> [ Call fname ] | None -> [ CallI r15 ]
    in
    let add_argc_counter =
      let argc_before_vararg =
        Option.bind fname (fun fname -> List.assoc_opt fname vararg_functions)
      in
      match argc_before_vararg with
      (* For vararg functions we pass the count of the vararg arguments
         only. It is used in assembly to unbox them. *)
      | Some argc -> [ Mov (L (nargs - argc), r11) ]
      (* For all other functions we pass the full arguments count; the
         function prologue compares it with the expected one. *)
      | None -> [ Mov (L nargs, r11) ]
    in
    let stack_slots, env, setup_args_code = setup_arguments env nargs in
    let push_registers, pop_registers = protect_registers env in
    let align_prologue, align_epilogue =
      align_stack (List.length push_registers) stack_slots
    in
    let env, setup_closure = setup_closure env in
    let env, move_result = move_result env in
    ( env,
      push_registers @ align_prologue @ setup_args_code @ setup_closure
      @ add_argc_counter @ call @ align_epilogue @ List.rev pop_registers
      @ move_result )
  in

  let compile_safe_point_call env fname nargs =
    let setup_arguments env nargs =
      let env, args = pop_arguments env [] nargs in
      (* All arguments go to the hardware stack, last one first, and rdi
         receives the address of the first one *)
      let setup_args_code =
        List.map (fun arg -> Push arg) (List.rev args) @ [ Mov (rsp, rdi) ]
      in
      (* Some builtins additionally receive a boxed element count in rsi *)
      let setup_args_code =
        if fname = labeled_builtin "closure" then
          setup_args_code @ [ Mov (L (box (nargs - 1)), rsi) ]
        else if
          fname = labeled_builtin "sexp" || fname = labeled_builtin "array"
        then setup_args_code @ [ Mov (L (box nargs), rsi) ]
        else setup_args_code
      in
      (nargs, env, setup_args_code)
    in
    let stack_slots, env, setup_args_code = setup_arguments env nargs in
    let push_registers, pop_registers = protect_registers env in
    let align_prologue, align_epilogue =
      align_stack (List.length push_registers) stack_slots
    in
    let env, move_result = move_result env in
    ( env,
      push_registers @ align_prologue @ setup_args_code @ [ Call fname ]
      @ align_epilogue @ List.rev pop_registers @ move_result )
  in

  if safepoint_call then compile_safe_point_call env (Option.get fname) nargs
  else if tail_call_optimization_applicable then
    compile_tail_call env fname nargs
  else compile_common_call env fname nargs
|
|
|
|
(** Keeps the given stabs directives when targeting Linux and drops them
    when targeting Darwin. *)
let opt_stabs env stabs =
  match env#mode.target_os with
  | Linux -> stabs
  | Darwin -> []
|
|
|
|
(* Symbolic stack machine evaluator

   compile : cmd -> env -> imports -> prg -> env * instr list

   Takes the command line object, an environment, the list of imported
   unit names and a stack machine program, and returns a pair --- the
   updated environment and the list of x86 instructions.

   Every stack machine instruction is preceded in the output by a comment
   with its textual form; in debug mode the symbolic stack state is added
   as well. While the environment is in the barrier state, only labels are
   processed and everything else is skipped.
*)
let compile cmd env imports code =
  let rec compile' env scode =
    match scode with
    | [] -> (env, [])
    | instr :: scode' ->
        let stack_state = if env#mode.is_debug then env#show_stack else "" in
        let env', code' =
          if env#is_barrier then
            match instr with
            | LABEL s ->
                if env#has_stack s then
                  (env#drop_barrier#retrieve_stack s, [ Label s ])
                else (env#drop_stack, [])
            | FLABEL s -> (env#drop_barrier, [ Label s ])
            | SLABEL s -> (env, [ Label s ])
            | _ -> (env, [])
          else
            match instr with
            | PUBLIC name -> (env#register_public name, [])
            | EXTERN name -> (env#register_extern name, [])
            | IMPORT _ -> (env, [])
            | CLOSURE (name, closure) ->
                let ext = if env#is_external name then E else I in
                let address = M (F, ext, A, name) in
                let l, env = env#allocate in
                let env, push_closure_code =
                  List.fold_left
                    (fun (env, code) c ->
                      let cr, env = env#allocate in
                      (env, mov (env#loc c) cr @ code))
                    (env, []) closure
                in
                let env, call_code =
                  compile_call env ~fname:".closure"
                    (1 + List.length closure)
                    false
                in
                (env, push_closure_code @ mov address l @ call_code)
            | CONST n ->
                let s, env' = env#allocate in
                (env', mov (L (box n)) s)
            | STRING s ->
                let addr, env = env#string s in
                let l, env = env#allocate in
                let env, call = compile_call env ~fname:".string" 1 false in
                (env, mov addr l @ call)
            | LDA _ ->
                failwith
                  "Should not happen. Indirect assignemts are temporarily \
                   prohibited."
                (*
                let s, env' = (env#variable x)#allocate in
                let s', env'' = env'#allocate in
                let loc_x = env'#loc x in
                match loc_x with
                | R _ ->
                    failwith
                      "We are not able to take an address of a register. This \
                       is the known limitation of 64-bit compiler. If you \
                       encountered this issue, just do not use indirect \
                       assignment :("
                | _ ->
                    ();
                    (env'', [ Lea (loc_x, rax); Mov (rax, s); Mov (rax, s') ])*)
            | LD x -> (
                let s, env' = (env#variable x)#allocate in
                ( env',
                  match s with
                  (* memory destinations are written through rax *)
                  | S _ | M _ -> [ Mov (env'#loc x, rax); Mov (rax, s) ]
                  | _ -> [ Mov (env'#loc x, s) ] ))
            | ST x -> (
                let env' = env#variable x in
                let s = env'#peek in
                ( env',
                  match s with
                  | S _ | M _ -> [ Mov (s, rax); Mov (rax, env'#loc x) ]
                  | _ -> [ Mov (s, env'#loc x) ] ))
            | STA -> compile_call env ~fname:".sta" 3 false
            | STI ->
                failwith
                  "Should not happen. Indirect assignemts are temporarily \
                   prohibited."
                (*
                let v, env = env#pop in
                let x = env#peek in
                ( env,
                  match x with
                  | S _ | M _ ->
                      [
                        Mov (v, rdx);
                        Mov (x, rax);
                        Mov (rdx, I (0, rax));
                        Mov (rdx, x);
                      ]
                  | _ -> [ Mov (v, rax); Mov (rax, I (0, x)); Mov (rax, x) ] )*)
            | BINOP op -> compile_binop env op
            | LABEL s | FLABEL s | SLABEL s -> (env, [ Label s ])
            | JMP l -> ((env#set_stack l)#set_barrier, [ Jmp l ])
            | CJMP (s, l) ->
                let x, env = env#pop in
                ( env#set_stack l,
                  [ Sar1 x; (*!!!*) Binop ("cmp", L 0, x); CJmp (s, l) ] )
            | BEGIN (f, nargs, nlocals, closure, _args, scopes) ->
                (* User functions must not reuse the names of the runtime
                   functions that get special calling treatment *)
                let () =
                  let is_safepoint = List.mem f safepoint_functions in
                  let is_vararg =
                    Option.is_some @@ List.assoc_opt f vararg_functions
                  in
                  if is_safepoint || is_vararg then
                    raise
                      (Failure
                         (Printf.sprintf
                            "Function name %s is reserved for built-in" f))
                in
                (* Debug directives for the variables of a scope and of all
                   its nested scopes *)
                let rec stabs_scope scope =
                  let names =
                    List.map
                      (fun (name, index) ->
                        Meta
                          (Printf.sprintf "\t.stabs \"%s:1\",128,0,0,-%d" name
                             (stack_offset index)))
                      scope.names
                  in
                  let sub_stabs =
                    List.flatten @@ List.map stabs_scope scope.subs
                  in
                  if names = [] then sub_stabs
                  else
                    names
                    @ [
                        Meta
                          (Printf.sprintf "\t.stabn 192,0,0,%s-%s" scope.blab f);
                      ]
                    @ sub_stabs
                    @ [
                        Meta
                          (Printf.sprintf "\t.stabn 224,0,0,%s-%s" scope.elab f);
                      ]
                in
                (* Function name without the leading 'L', if there is one *)
                let name =
                  if f.[0] = 'L' then String.sub f 1 (String.length f - 1)
                  else f
                in
                let stabs =
                  opt_stabs env
                    (if f = "main" then
                       [ Meta (Printf.sprintf "\t.type main, @function") ]
                     else
                       let func =
                         [
                           Meta (Printf.sprintf "\t.type %s, @function" name);
                           Meta
                             (Printf.sprintf "\t.stabs \"%s:F1\",36,0,0,%s" name
                                f);
                         ]
                       in
                       let arguments =
                         [] (* TODO: stabs for function arguments *)
                       in
                       let variables =
                         List.flatten @@ List.map stabs_scope scopes
                       in
                       func @ arguments @ variables)
                in
                (* Every function except the top-level one compares the
                   arguments count received in r11 with its own [nargs] and
                   calls "failure" on mismatch *)
                let env, check_argc =
                  if f = cmd#topname then (env, [])
                  else
                    let argc_correct_label = f ^ "_argc_correct" in
                    let pat_addr, env =
                      env#string
                        "Function %s called with incorrect arguments count. \
                         Expected: %d. Actual: %d\\n"
                    in
                    let name_addr, env = env#string name in
                    let pat_loc, env = env#allocate in
                    let name_loc, env = env#allocate in
                    let expected_loc, env = env#allocate in
                    let actual_loc, env = env#allocate in
                    let env, fail_call =
                      compile_call env ~fname:"failure" 4 false
                    in
                    (* drop the slot allocated for the result of the call *)
                    let _, env = env#pop in
                    ( env,
                      [
                        Meta "# Check arguments count";
                        Binop ("cmp", L nargs, r11);
                        CJmp ("e", argc_correct_label);
                        Mov (r11, actual_loc);
                        Mov (L nargs, expected_loc);
                        Mov (name_addr, name_loc);
                        Mov (pat_addr, pat_loc);
                      ]
                      @ fail_call
                      @ [ Label argc_correct_label ] )
                in
                env#assert_empty_stack;
                let has_closure = closure <> [] in
                let env = env#enter f nargs nlocals has_closure in
                ( env,
                  stabs
                  @ [ Meta "\t.cfi_startproc" ]
                  @ (if f = cmd#topname then
                       (* The top-level function body runs only once: it
                          returns immediately when "init" is already set *)
                       [
                         Mov (M (D, I, V, "init"), rax);
                         Binop ("test", rax, rax);
                         CJmp ("z", "continue");
                         Ret;
                         Label "_ERROR";
                         Call (labeled "binoperror");
                         Ret;
                         Label "_ERROR2";
                         Call (labeled "binoperror2");
                         Ret;
                         Label "continue";
                         Mov (L 1, M (D, I, V, "init"));
                       ]
                     else [])
                  @ [
                      Push rbp;
                      Meta "\t.cfi_def_cfa_offset\t8";
                      Meta "\t.cfi_offset 5, -8";
                      Mov (rsp, rbp);
                      Meta "\t.cfi_def_cfa_register\t5";
                      Binop ("-", C env#lsize, rsp);
                      (* Fill the frame with the filler value; rdi, rsi and
                         rcx are saved in r12-r14 around the copy *)
                      Mov (rdi, r12);
                      Mov (rsi, r13);
                      Mov (rcx, r14);
                      Mov (rsp, rdi);
                      Lea (filler, rsi);
                      Mov (C env#allocated_size, rcx);
                      Repmovsl;
                      Mov (r12, rdi);
                      Mov (r13, rsi);
                      Mov (r14, rcx);
                    ]
                  @ (if f = "main" then
                       [
                         (* Align stack as `main` function could be called misaligned *)
                         Mov (L 0xF, rax);
                         Binop ("test", rsp, rax);
                         CJmp ("z", "ALIGNED");
                         Push filler;
                         Label "ALIGNED";
                         (* Initialize gc and arguments *)
                         Push rdi;
                         Push rsi;
                         Call "__gc_init";
                         Pop rsi;
                         Pop rdi;
                         Call "set_args";
                       ]
                     else [])
                  @ (if f = cmd#topname then
                       (* Initialize every imported unit except Std *)
                       List.map
                         (fun i -> Call ("init" ^ i))
                         (List.filter (fun i -> i <> "Std") imports)
                     else [])
                  @ check_argc )
            | END ->
                let x, env = env#pop in
                env#assert_empty_stack;
                let name = env#fname in
                let stabs =
                  opt_stabs env
                    [ Meta (Printf.sprintf "\t.size %s, .-%s" name name) ]
                in
                ( env#leave,
                  [
                    Mov (x, rax);
                    (*!!*)
                    Label env#epilogue;
                    Mov (rbp, rsp);
                    Pop rbp;
                  ]
                  @ (if name = "main" then [ Binop ("^", rax, rax) ] else [])
                  @ [
                      Meta "\t.cfi_restore\trbp";
                      Meta "\t.cfi_def_cfa\t4, 4";
                      Ret;
                      Meta "\t.cfi_endproc";
                      Meta
                        (* Allocate space for the symbolic stack
                           Add extra word if needed to preserve alignment *)
                        (Printf.sprintf "\t.set\t%s,\t%d"
                           (env#prefixed env#lsize)
                           (if env#allocated mod 2 = 0 then
                              env#allocated * word_size
                            else (env#allocated + 1) * word_size));
                      Meta
                        (Printf.sprintf "\t.set\t%s,\t%d"
                           (env#prefixed env#allocated_size)
                           env#allocated);
                    ]
                  @ stabs )
            | RET ->
                let x = env#peek in
                (env, [ Mov (x, rax); Jmp env#epilogue ])
            | ELEM -> compile_call env ~fname:".elem" 2 false
            | CALL (fname, n, tail) -> compile_call env ~fname n tail
            | CALLC (n, tail) -> compile_call env n tail
            | SEXP (t, n) ->
                let s, env = env#allocate in
                let env, code = compile_call env ~fname:".sexp" (n + 1) false in
                (env, mov (L (box (env#hash t))) s @ code)
            | DROP -> (snd env#pop, [])
            | DUP ->
                let x = env#peek in
                let s, env = env#allocate in
                (env, mov x s)
            | SWAP ->
                let x, y = env#peek2 in
                (env, [ Push x; Push y; Pop x; Pop y ])
            | TAG (t, n) ->
                let s1, env = env#allocate in
                let s2, env = env#allocate in
                let env, code = compile_call env ~fname:".tag" 3 false in
                (env, mov (L (box (env#hash t))) s1 @ mov (L (box n)) s2 @ code)
            | ARRAY n ->
                let s, env = env#allocate in
                let env, code = compile_call env ~fname:".array_patt" 2 false in
                (* [mov] rather than a raw [Mov], as in SEXP and TAG, so
                   that literals which cannot be stored to memory directly
                   are handled *)
                (env, mov (L (box n)) s @ code)
            | PATT StrCmp -> compile_call env ~fname:".string_patt" 2 false
            | PATT patt ->
                compile_call env
                  ~fname:
                    (match patt with
                    | Boxed -> ".boxed_patt"
                    | UnBoxed -> ".unboxed_patt"
                    | Array -> ".array_tag_patt"
                    | String -> ".string_tag_patt"
                    | Sexp -> ".sexp_tag_patt"
                    | Closure -> ".closure_tag_patt"
                    | StrCmp ->
                        failwith
                          (Printf.sprintf "Unexpected pattern: StrCmp %s: %d"
                             __FILE__ __LINE__))
                  1 false
            | LINE line -> env#gen_line line
            | FAIL ((line, col), value) ->
                (* [value] tells whether the scrutinee stays on the stack *)
                let value, env = if value then (env#peek, env) else env#pop in
                let msg_addr, env = env#string cmd#get_infile in
                let value_arg_addr, env = env#allocate in
                let msg_arg_addr, env = env#allocate in
                let line_arg_addr, env = env#allocate in
                let col_arg_addr, env = env#allocate in
                let env, code =
                  compile_call env ~fname:".match_failure" 4 false
                in
                let _, env = env#pop in
                ( env,
                  mov (L col) col_arg_addr @ mov (L line) line_arg_addr
                  @ mov msg_addr msg_arg_addr @ mov value value_arg_addr @ code
                )
            | i ->
                invalid_arg
                  (Printf.sprintf "invalid SM insn: %s\n" (GT.show insn i))
        in
        let env'', code'' = compile' env' scode' in
        let debug_info =
          let insn = GT.show SM.insn instr in
          if env#mode.is_debug then
            [ Meta ("# " ^ insn); Meta ("# " ^ stack_state) ]
          else [ Meta ("# " ^ insn) ]
        in
        (env'', debug_info @ code' @ code'')
  in
  compile' env code
|
|
|
|
(** Symbolic stack over an abstract set of registers.

    Positions are handed out in a fixed order: first the registers, in the
    order of the array passed to [empty], then numbered stack slots
    starting from 0. With an empty register array every position is a
    stack slot. *)
module AbstractSymbolicStack : sig
  type 'a t
  type 'a symbolic_location = Stack of int | Register of 'a

  val empty : 'a array -> 'a t
  (** Empty stack that allocates from the given registers first. *)

  val is_empty : _ t -> bool

  val live_registers : 'a t -> 'a list
  (** Registers currently occupied by stack entries. *)

  val stack_size : _ t -> int
  (** Number of entries that live in stack slots rather than registers. *)

  val allocate : 'a t -> 'a t * 'a symbolic_location
  (** Pushes a new entry and returns its location. *)

  val pop : 'a t -> 'a t * 'a symbolic_location
  (** Removes the top entry and returns its location.
      @raise Failure on an empty stack. *)

  val peek : 'a t -> 'a symbolic_location
  (** Location of the top entry.
      @raise Failure on an empty stack. *)

  val peek2 : 'a t -> 'a symbolic_location * 'a symbolic_location
  (** Locations of the top entry and of the one below it.
      @raise Failure if the stack has fewer than two entries. *)
end = struct
  type 'a symbolic_location = Stack of int | Register of 'a

  (* Last allocated position on symbolic stack *)
  type stack_state = S of int | R of int | E
  type 'a t = stack_state * 'a array

  let empty registers = (E, registers)

  (* Position following the current top *)
  let next (state, registers) =
    let count = Array.length registers in
    let state =
      match state with
      | S n -> S (n + 1)
      | R n when n + 1 = count -> S 0
      | R n -> R (n + 1)
      (* with no registers at all the first position is a stack slot *)
      | E -> if count = 0 then S 0 else R 0
    in
    (state, registers)

  (* Position preceding the current top *)
  let previous (state, registers) =
    let count = Array.length registers in
    let state =
      match state with
      (* below the first stack slot is the last register, if there is one *)
      | S 0 -> if count = 0 then E else R (count - 1)
      | S n -> S (n - 1)
      | R 0 -> E
      | R n -> R (n - 1)
      | E -> failwith (Printf.sprintf "Empty stack %s: %d" __FILE__ __LINE__)
    in
    (state, registers)

  let location (state, registers) =
    match state with
    | S n -> Stack n
    | R n -> Register registers.(n)
    | E -> failwith (Printf.sprintf "Empty stack %s: %d" __FILE__ __LINE__)

  let is_empty (state, _) = match state with E -> true | S _ | R _ -> false

  let live_registers (stack, registers) =
    match stack with
    | S _ -> Array.to_list registers
    | R n -> Array.to_list (Array.sub registers 0 (n + 1))
    | E -> []

  let stack_size (state, _) = match state with S n -> n + 1 | R _ | E -> 0

  let allocate state =
    let state = next state in
    (state, location state)

  let pop stack = (previous stack, location stack)
  let peek stack = location stack
  let peek2 stack = (location stack, location (previous stack))
end
|
|
|
|
(* Symbolic stack specialised to machine operands.  Positions are taken from
   [Registers.extra_caller_saved_registers] first and from stack slots
   afterwards; stack slot numbers are shifted by the [nlocals] value given to
   [empty]. *)
module SymbolicStack : sig
  type t

  val empty : int -> t
  val is_empty : t -> bool
  val live_registers : t -> opnd list
  val stack_size : t -> int
  val allocate : t -> t * opnd
  val pop : t -> t * opnd
  val peek : t -> opnd
  val peek2 : t -> opnd * opnd
end = struct
  module Abstract = AbstractSymbolicStack

  type t = { state : Register.t Abstract.t; nlocals : int }

  (* To use free argument registers we have to rewrite function call compilation.
     Otherwise we will result with the following code in arguments setup:
       movq %rcx, %rdx
       movq %rdx, %rsi *)
  let empty nlocals =
    let state = Abstract.empty Registers.extra_caller_saved_registers in
    { state; nlocals }

  (* Turns an abstract location into an operand; stack slots are numbered
     after the [nlocals] leading positions *)
  let opnd_from_loc { nlocals; _ } location =
    match location with
    | Abstract.Register r -> R r
    | Abstract.Stack n -> S (n + nlocals)

  (* Rebuilds the stack around a new abstract state and converts the location
     that came with it *)
  let with_state stack (state, location) =
    ({ stack with state }, opnd_from_loc stack location)

  let is_empty stack = Abstract.is_empty stack.state

  let live_registers stack =
    stack.state |> Abstract.live_registers |> List.map (fun r -> R r)

  let stack_size stack = Abstract.stack_size stack.state
  let allocate stack = with_state stack (Abstract.allocate stack.state)
  let pop stack = with_state stack (Abstract.pop stack.state)
  let peek stack = opnd_from_loc stack (Abstract.peek stack.state)

  let peek2 stack =
    let top, below = Abstract.peek2 stack.state in
    (opnd_from_loc stack top, opnd_from_loc stack below)
end

(* Sets whose elements are strings *)
module S = Set.Make (String)

(* Maps whose keys are strings *)
module M = Map.Make (String)

(* Environment implementation: an immutable object carried through code
   generation.  Every method that changes something returns an updated copy
   of the object instead of mutating it. *)
class env prg mode =
  (* Alphabet of [hash]: a character is encoded by its index in this string *)
  let chars =
    "_abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789'"
  in
  (* Argument registers wrapped as operands *)
  let argument_registers =
    Array.map (fun r -> R r) Registers.argument_registers
  in
  let argument_registers_size = Array.length argument_registers in
  object (self)
    inherit SM.indexer prg

    (* labels of the global variables seen so far *)
    val globals = S.empty

    (* escaped string constant -> label of its definition *)
    val stringm : string M.t = M.empty

    (* number of distinct string constants registered *)
    val scount = 0

    (* largest number of stack positions needed by the current function *)
    val stack_slots = 0

    (* static data size; set to the number of locals by [enter] *)
    val static_size = 0

    (* symbolic stack of the current function *)
    val stack = SymbolicStack.empty 0

    (* number of arguments of the current function *)
    val nargs = 0

    (* function local variables (printed by [print_locals]) *)
    val locals = []

    (* name of the current function *)
    val fname = ""

    (* label -> symbolic stack saved for that label *)
    val stackmap = M.empty

    (* barrier condition *)
    val barrier = false

    (* compilation mode *)
    val mode = mode

    (* largest [stack_slots] value recorded by [leave] *)
    val max_locals_size = 0
    val has_closure = false
    val publics = S.empty
    val externs = S.empty

    (* counter used to number the labels made by [gen_line] *)
    val nlabels = 0

    (* true until the first [gen_line] after [enter] *)
    val first_line = true
    method mode = mode
    method publics = S.elements publics
    method register_public name = {<publics = S.add name publics>}
    method register_extern name = {<externs = S.add name externs>}
    method max_locals_size = max_locals_size
    method has_closure = has_closure
    method fname = fname

    (* records the stack demand of the function being left *)
    method leave =
      if max_locals_size >= stack_slots then self
      else {<max_locals_size = stack_slots>}

    (* renders the symbolic stack, bottom first, one space after each operand *)
    method show_stack =
      let rec render remaining rendered =
        if SymbolicStack.is_empty remaining then rendered
        else
          let rest, top = SymbolicStack.pop remaining in
          render rest (show_opnd top ^ " " ^ rendered)
      in
      render stack ""

    (* prints the locals to standard output *)
    method print_locals =
      Printf.printf "LOCALS: size = %d\n" static_size;
      locals
      |> List.iter (fun scope ->
             Printf.printf "(";
             List.iter
               (fun (name, index) -> Printf.printf "%s=%d " name index)
               scope;
             Printf.printf ")\n");
      Printf.printf "END LOCALS\n"

    (* Assert empty stack *)
    method assert_empty_stack = assert (SymbolicStack.is_empty stack)

    (* check barrier condition *)
    method is_barrier = barrier

    (* set barrier *)
    method set_barrier = {<barrier = true>}

    (* drop barrier *)
    method drop_barrier = {<barrier = false>}

    (* replaces the symbolic stack with an empty one *)
    method drop_stack = {<stack = SymbolicStack.empty static_size>}

    (* saves the current symbolic stack under a label *)
    method set_stack l = {<stackmap = M.add l stack stackmap>}

    (* restores the stack saved for a label; no change if none was saved *)
    method retrieve_stack l =
      match M.find_opt l stackmap with
      | Some saved -> {<stack = saved>}
      | None -> self

    (* tells whether a stack was saved for a label *)
    method has_stack l = M.mem l stackmap
    method is_external name = S.mem name externs

    (* gets a location for a variable *)
    method loc x =
      match x with
      | Value.Global name ->
          let label = labeled_global name in
          let linkage = if self#is_external name then E else I in
          M (D, linkage, V, label)
      | Value.Fun name ->
          let linkage = if self#is_external name then E else I in
          M (F, linkage, A, name)
      | Value.Local i -> S i
      (* the first arguments live in the argument registers *)
      | Value.Arg i when i < argument_registers_size -> argument_registers.(i)
      (* the remaining ones get negative stack indices, starting at -1 *)
      | Value.Arg i -> S (-(i - argument_registers_size) - 1)
      | Value.Access i -> I (word_size * (i + 1), r15)

    (* allocates a fresh position on a symbolic stack and keeps track of the
       largest number of stack positions required so far *)
    method allocate =
      let stack', fresh = SymbolicStack.allocate stack in
      let required = static_size + SymbolicStack.stack_size stack' in
      (fresh, {<stack = stack'; stack_slots = max stack_slots required>})

    (* pops one operand from the symbolic stack *)
    method pop =
      let stack', top = SymbolicStack.pop stack in
      (top, {<stack = stack'>})

    (* is rdx register in use: true when the function has more than two
       arguments *)
    method rdx_in_use = nargs > 2

    (* locations of [n] call arguments together with the number of them that
       do not fit into the argument registers *)
    method arguments_locations n =
      let in_registers regs =
        regs |> Array.to_list |> List.map (fun r -> Register r)
      in
      if n < argument_registers_size then
        (in_registers (Array.sub argument_registers 0 n), 0)
      else
        let spilled = n - argument_registers_size in
        ( in_registers argument_registers @ List.init spilled (fun _ -> Stack),
          spilled )

    (* peeks the top of the stack (the stack does not change) *)
    method peek = SymbolicStack.peek stack

    (* peeks two topmost values from the stack (the stack itself does not change) *)
    method peek2 = SymbolicStack.peek2 stack

    (* tag hash: packs at most the first ten characters of the tag, six bits
       per character; String.index raises Not_found for a character that is
       not in [chars] *)
    method hash tag =
      let last = min (String.length tag - 1) 9 in
      let rec pack i acc =
        if i > last then acc
        else pack (i + 1) ((acc lsl 6) lor String.index chars tag.[i])
      in
      pack 0 0

    (* registers a variable in the environment; only globals are recorded *)
    method variable x =
      match x with
      | Value.Global name -> {<globals = S.add (labeled_global name) globals>}
      | _ -> self

    (* registers a string constant: returns the operand naming its label and
       the updated environment; equal escaped texts share one label *)
    method string x =
      (* Escapes double quotes and doubles every backslash that does not
         start one of the sequences backslash-n, backslash-t, backslash-r *)
      let escape raw =
        let len = String.length raw in
        let out = Buffer.create (len * 2) in
        let rec scan pos =
          if pos < len then
            match raw.[pos] with
            | '"' ->
                Buffer.add_string out "\\\"";
                scan (pos + 1)
            | '\\' -> (
                let following =
                  if pos + 1 < len then Some raw.[pos + 1] else None
                in
                match following with
                | Some (('n' | 't' | 'r') as c) ->
                    Buffer.add_char out '\\';
                    Buffer.add_char out c;
                    scan (pos + 2)
                | Some _ | None ->
                    Buffer.add_string out "\\\\";
                    scan (pos + 1))
            | c ->
                Buffer.add_char out c;
                scan (pos + 1)
        in
        scan 0;
        Buffer.contents out
      in
      let key = escape x in
      match M.find_opt key stringm with
      | Some label -> (M (D, I, A, label), self)
      | None ->
          let label = Printf.sprintf "string_%d" scount in
          ( M (D, I, A, label),
            {<scount = scount + 1; stringm = M.add key label stringm>} )

    (* gets number of arguments in the current function *)
    method nargs = nargs

    (* gets all global variables that are not external *)
    method globals = S.elements (S.diff globals externs)

    (* gets all string definitions as (escaped text, label) pairs *)
    method strings = M.bindings stringm

    (* gets a number of stack positions allocated *)
    method allocated = stack_slots
    method allocated_size = labeled ("S" ^ fname ^ "_SIZE")

    (* enters a function: resets the per-function state *)
    method enter f nargs nlocals has_closure =
      {<fname = f
       ; nargs = nargs
       ; has_closure = has_closure
       ; static_size = nlocals
       ; stack_slots = nlocals
       ; stack = SymbolicStack.empty nlocals
       ; first_line = true>}

    (* returns a label for the epilogue *)
    method epilogue = labeled (fname ^ "_epilogue")

    (* returns a name for local size meta-symbol *)
    method lsize = labeled (fname ^ "_SIZE")

    (* returns a list of live registers: the argument registers taken by the
       current function followed by those of the symbolic stack *)
    method live_registers =
      let used_arguments = min nargs argument_registers_size in
      (Array.sub argument_registers 0 used_arguments |> Array.to_list)
      @ SymbolicStack.live_registers stack

    (* generate a line number information for current function: returns the
       updated environment and the instructions to emit *)
    method gen_line line =
      let lab = Printf.sprintf ".L%d" nlabels in
      let stabs directive = opt_stabs self [ Meta directive ] in
      let line_info =
        if fname = "main" then
          stabs (Printf.sprintf "\t.stabn 68,0,%d,%s" line lab)
        else
          let function_start =
            if first_line then
              stabs (Printf.sprintf "\t.stabn 68,0,%d,0" line)
            else []
          in
          function_start
          @ stabs (Printf.sprintf "\t.stabn 68,0,%d,%s-%s" line lab fname)
      in
      ({<nlabels = nlabels + 1; first_line = false>}, line_info @ [ Label lab ])

    (* symbol name as written for the target: Darwin gets a leading
       underscore *)
    method prefixed label =
      let { target_os; _ } = mode in
      match target_os with Linux -> label | Darwin -> "_" ^ label
  end

(* Generates an assembler text for a program:
   first compiles the program into the stack code,
   then generates assembler code from it,
   then renders the whole assembler file as a string *)
let genasm cmd prog =
  let mode = { is_debug = cmd#is_debug; target_os = cmd#target_os } in
  let sm = SM.compile cmd prog in
  let env, code = compile cmd (new env sm mode) (fst (fst prog)) sm in
  (* one .globl directive per public symbol *)
  let globals =
    env#publics
    |> List.map (fun name ->
           Meta (Printf.sprintf "\t.globl\t%s" (env#prefixed name)))
  in
  (* one .string definition per registered string constant *)
  let string_definitions =
    env#strings
    |> List.map (fun (contents, label) ->
           Meta
             (Printf.sprintf "%s:\t.string\t\"%s\"" (env#prefixed label)
                contents))
  in
  let custom_section =
    match env#mode.target_os with
    | Linux -> "\t.section custom_data,\"aw\",@progbits"
    | Darwin -> "\t.section __DATA, custom_data, regular, no_dead_strip"
  in
  (* definition of one global variable, preceded by its optional stabs entry;
     the stabs entry names the variable without the global label prefix *)
  let global_definition label =
    let prefix_length = String.length global_label in
    let bare_name =
      String.sub label prefix_length (String.length label - prefix_length)
    in
    opt_stabs env
      [ Meta (Printf.sprintf "\t.stabs \"%s:S1\",40,0,0,%s" bare_name label) ]
    @ [ Meta (Printf.sprintf "%s:\t.quad\t1" (env#prefixed label)) ]
  in
  let data =
    List.concat
      [
        [ Meta "\t.data" ];
        string_definitions;
        [
          Meta (env#prefixed "init" ^ ":\t.quad 0");
          Meta custom_section;
          Meta
            (Printf.sprintf "%s:\t.fill\t%d, 8, 1" (env#prefixed "filler")
               env#max_locals_size);
        ];
        List.concat (List.map global_definition env#globals);
      ]
  in
  let program =
    List.concat
      [
        [ Meta (Printf.sprintf "\t.file \"%s\"" cmd#get_absolute_infile) ];
        opt_stabs env
          [
            Meta
              (Printf.sprintf "\t.stabs \"%s\",100,0,0,.Ltext"
                 cmd#get_absolute_infile);
          ];
        globals;
        data;
        [ Meta "\t.text"; Label ".Ltext" ];
        opt_stabs env
          [ Meta "\t.stabs \"data:t1=r1;0;4294967295;\",128,0,0,0" ];
        code;
      ]
  in
  (* every instruction goes on its own line *)
  let asm = Buffer.create 1024 in
  List.iter
    (fun instruction ->
      Buffer.add_string asm (show env instruction);
      Buffer.add_char asm '\n')
    program;
  Buffer.contents asm

(* Builds a program: dumps the assembler file and the interface file, then
   runs the external compiler on the assembler file (clang on Darwin, gcc on
   Linux).  In the default mode the result is linked with the object files of
   all transitively imported units and with the runtime library; in the
   compile mode only an object file is produced.  Raises Failure when the
   external compiler exits with a non-zero code. *)
let build cmd prog =
  (* Object files of the imports and of everything they import in turn.
     Each unit is visited once; "Std" is treated as already visited. *)
  let find_objects imports paths =
    let module Seen = Set.Make (String) in
    let rec visit objects seen = function
      | [] -> objects
      | unit_name :: pending when Seen.mem unit_name seen ->
          visit objects seen pending
      | unit_name :: pending ->
          let path, intfs = Interface.find unit_name paths in
          (* the imports of the unit are visited before the pending ones *)
          let pending =
            List.fold_right
              (fun item names ->
                match item with `Import name -> name :: names | _ -> names)
              intfs pending
          in
          visit
            (Filename.concat path (unit_name ^ ".o") :: objects)
            (Seen.add unit_name seen) pending
    in
    visit [] (Seen.singleton "Std") imports
  in
  (* Runs a shell command and fails on a non-zero exit code *)
  let run_toolchain cmdline =
    let exit_code = Sys.command cmdline in
    if exit_code <> 0 then
      failwith
        (Printf.sprintf "Assembly compiler failed with exit code %d" exit_code)
  in
  cmd#dump_file "s" (genasm cmd prog);
  cmd#dump_file "i" (Interface.gen prog);
  let compiler =
    match (cmd#target_os, cmd#march) with
    | Linux, `AMD64 -> "gcc"
    | Linux, `X86_32 -> "gcc -m32"
    | Darwin, `AMD64 -> "clang"
    | Darwin, `X86_32 ->
        Printf.eprintf "X86_32 on darwin is not supported\n";
        exit 1
  in
  let compiler_flags, linker_flags =
    match cmd#target_os with
    | Linux -> ("-Wa,--noexecstack", "")
    | Darwin -> ("-arch x86_64 -Wa,--noexecstack", "-ld_classic")
  in
  let debug_flags = if cmd#is_debug then "-g" else "" in
  match cmd#get_mode with
  | `Default ->
      let objs = find_objects (fst @@ fst prog) cmd#get_include_paths in
      (* every object file name is followed by one space *)
      let object_arguments =
        String.concat "" (List.map (fun obj -> obj ^ " ") objs)
      in
      let runtime_library =
        match cmd#march with `AMD64 -> "runtime" | `X86_32 -> "runtime32"
      in
      run_toolchain
        (Printf.sprintf "%s %s %s %s %s %s.s %s %s/%s.a" compiler
           compiler_flags linker_flags debug_flags cmd#get_output_option
           cmd#basename object_arguments cmd#get_runtime_path runtime_library)
  | `Compile ->
      (* NOTE(review): -g is passed here regardless of [debug_flags];
         confirm whether that is intended *)
      run_toolchain
        (Printf.sprintf "%s %s %s -c -g %s.s" compiler compiler_flags
           debug_flags cmd#basename)
  | _ -> invalid_arg "must not happen"