ocaml/asmcomp/amd64/selection.ml

289 lines
10 KiB
OCaml

(**************************************************************************)
(* *)
(* OCaml *)
(* *)
(* Xavier Leroy, projet Cristal, INRIA Rocquencourt *)
(* *)
(* Copyright 2000 Institut National de Recherche en Informatique et *)
(* en Automatique. *)
(* *)
(* All rights reserved. This file is distributed under the terms of *)
(* the GNU Lesser General Public License version 2.1, with the *)
(* special exception on linking described in the file LICENSE. *)
(* *)
(**************************************************************************)
(* Instruction selection for the AMD64 *)
open Arch
open Proc
open Cmm
open Mach
(* Auxiliary for recognizing addressing modes *)
type addressing_expr =
Asymbol of string
| Alinear of expression
| Aadd of expression * expression
| Ascale of expression * int
| Ascaledadd of expression * expression * int
let rec select_addr exp =
match exp with
Cconst_symbol (s, _) when not !Clflags.dlcode ->
(Asymbol s, 0)
| Cop((Caddi | Caddv | Cadda), [arg; Cconst_int (m, _)], _) ->
let (a, n) = select_addr arg in (a, n + m)
| Cop(Csubi, [arg; Cconst_int (m, _)], _) ->
let (a, n) = select_addr arg in (a, n - m)
| Cop((Caddi | Caddv | Cadda), [Cconst_int (m, _); arg], _) ->
let (a, n) = select_addr arg in (a, n + m)
| Cop(Clsl, [arg; Cconst_int((1|2|3 as shift), _)], _) ->
begin match select_addr arg with
(Alinear e, n) -> (Ascale(e, 1 lsl shift), n lsl shift)
| _ -> (Alinear exp, 0)
end
| Cop(Cmuli, [arg; Cconst_int((2|4|8 as mult), _)], _) ->
begin match select_addr arg with
(Alinear e, n) -> (Ascale(e, mult), n * mult)
| _ -> (Alinear exp, 0)
end
| Cop(Cmuli, [Cconst_int((2|4|8 as mult), _); arg], _) ->
begin match select_addr arg with
(Alinear e, n) -> (Ascale(e, mult), n * mult)
| _ -> (Alinear exp, 0)
end
| Cop((Caddi | Caddv | Cadda), [arg1; arg2], _) ->
begin match (select_addr arg1, select_addr arg2) with
((Alinear e1, n1), (Alinear e2, n2)) ->
(Aadd(e1, e2), n1 + n2)
| ((Alinear e1, n1), (Ascale(e2, scale), n2)) ->
(Ascaledadd(e1, e2, scale), n1 + n2)
| ((Ascale(e1, scale), n1), (Alinear e2, n2)) ->
(Ascaledadd(e2, e1, scale), n1 + n2)
| (_, (Ascale(e2, scale), n2)) ->
(Ascaledadd(arg1, e2, scale), n2)
| ((Ascale(e1, scale), n1), _) ->
(Ascaledadd(arg2, e1, scale), n1)
| _ ->
(Aadd(arg1, arg2), 0)
end
| arg ->
(Alinear arg, 0)
(* Special constraints on operand and result registers *)
exception Use_default
let rax = phys_reg 0
let rcx = phys_reg 5
let rdx = phys_reg 4
let pseudoregs_for_operation op arg res =
match op with
(* Two-address binary operations: arg.(0) and res.(0) must be the same *)
Iintop(Iadd|Isub|Imul|Iand|Ior|Ixor) | Iaddf|Isubf|Imulf|Idivf ->
([|res.(0); arg.(1)|], res)
(* One-address unary operations: arg.(0) and res.(0) must be the same *)
| Iintop_imm((Iadd|Isub|Imul|Iand|Ior|Ixor|Ilsl|Ilsr|Iasr), _)
| Iabsf | Inegf
| Ispecific(Ibswap (32|64)) ->
(res, res)
(* For xchg, args must be a register allowing access to high 8 bit register
(rax, rbx, rcx or rdx). Keep it simple, just force the argument in rax. *)
| Ispecific(Ibswap 16) ->
([| rax |], [| rax |])
(* For imulq, first arg must be in rax, rax is clobbered, and result is in
rdx. *)
| Iintop(Imulh) ->
([| rax; arg.(1) |], [| rdx |])
| Ispecific(Ifloatarithmem(_,_)) ->
let arg' = Array.copy arg in
arg'.(0) <- res.(0);
(arg', res)
(* For shifts with variable shift count, second arg must be in rcx *)
| Iintop(Ilsl|Ilsr|Iasr) ->
([|res.(0); rcx|], res)
(* For div and mod, first arg must be in rax, rdx is clobbered,
and result is in rax or rdx respectively.
Keep it simple, just force second argument in rcx. *)
| Iintop(Idiv) ->
([| rax; rcx |], [| rax |])
| Iintop(Imod) ->
([| rax; rcx |], [| rdx |])
(* Other instructions are regular *)
| _ -> raise Use_default
(* If you update [inline_ops], you may need to update [is_simple_expr] and/or
[effects_of], below. *)
let inline_ops =
[ "sqrt"; "caml_bswap16_direct"; "caml_int32_direct_bswap";
"caml_int64_direct_bswap"; "caml_nativeint_direct_bswap" ]
let is_immediate n = n <= 0x7FFF_FFFF && n >= -0x8000_0000
let is_immediate_natint n = n <= 0x7FFF_FFFFn && n >= -0x8000_0000n
(* The selector class *)
class selector = object (self)
inherit Selectgen.selector_generic as super
method! is_immediate op n =
match op with
| Iadd | Isub | Imul | Iand | Ior | Ixor | Icomp _ | Icheckbound _ ->
is_immediate n
| _ ->
super#is_immediate op n
method is_immediate_test _cmp n = is_immediate n
method! is_simple_expr e =
match e with
| Cop(Cextcall (fn, _, _, _, _), args, _)
when List.mem fn inline_ops ->
(* inlined ops are simple if their arguments are *)
List.for_all self#is_simple_expr args
| _ ->
super#is_simple_expr e
method! effects_of e =
match e with
| Cop(Cextcall(fn, _, _, _, _), args, _)
when List.mem fn inline_ops ->
Selectgen.Effect_and_coeffect.join_list_map args self#effects_of
| _ ->
super#effects_of e
method select_addressing _chunk exp =
let (a, d) = select_addr exp in
(* PR#4625: displacement must be a signed 32-bit immediate *)
if not (is_immediate d)
then (Iindexed 0, exp)
else match a with
| Asymbol s ->
(Ibased(s, d), Ctuple [])
| Alinear e ->
(Iindexed d, e)
| Aadd(e1, e2) ->
(Iindexed2 d, Ctuple[e1; e2])
| Ascale(e, scale) ->
(Iscaled(scale, d), e)
| Ascaledadd(e1, e2, scale) ->
(Iindexed2scaled(scale, d), Ctuple[e1; e2])
method! select_store is_assign addr exp =
match exp with
Cconst_int (n, _dbg) when is_immediate n ->
(Ispecific(Istore_int(Nativeint.of_int n, addr, is_assign)), Ctuple [])
| (Cconst_natint (n, _dbg)) when is_immediate_natint n ->
(Ispecific(Istore_int(n, addr, is_assign)), Ctuple [])
| (Cblockheader(n, _dbg))
when is_immediate_natint n ->
(Ispecific(Istore_int(n, addr, is_assign)), Ctuple [])
| _ ->
super#select_store is_assign addr exp
method! select_operation op args dbg =
match op with
(* Recognize the LEA instruction *)
Caddi | Caddv | Cadda | Csubi ->
begin match self#select_addressing Word_int (Cop(op, args, dbg)) with
(Iindexed _, _)
| (Iindexed2 0, _) -> super#select_operation op args dbg
| (addr, arg) -> (Ispecific(Ilea addr), [arg])
end
(* Recognize float arithmetic with memory. *)
| Caddf ->
self#select_floatarith true Iaddf Ifloatadd args
| Csubf ->
self#select_floatarith false Isubf Ifloatsub args
| Cmulf ->
self#select_floatarith true Imulf Ifloatmul args
| Cdivf ->
self#select_floatarith false Idivf Ifloatdiv args
| Cextcall("sqrt", _, _, false, _) ->
begin match args with
[Cop(Cload ((Double|Double_u as chunk), _), [loc], _dbg)] ->
let (addr, arg) = self#select_addressing chunk loc in
(Ispecific(Ifloatsqrtf addr), [arg])
| [arg] ->
(Ispecific Isqrtf, [arg])
| _ ->
assert false
end
(* Recognize store instructions *)
| Cstore ((Word_int|Word_val as chunk), _init) ->
begin match args with
[loc; Cop(Caddi, [Cop(Cload _, [loc'], _); Cconst_int (n, _dbg)], _)]
when loc = loc' && is_immediate n ->
let (addr, arg) = self#select_addressing chunk loc in
(Ispecific(Ioffset_loc(n, addr)), [arg])
| _ ->
super#select_operation op args dbg
end
| Cextcall("caml_bswap16_direct", _, _, _, _) ->
(Ispecific (Ibswap 16), args)
| Cextcall("caml_int32_direct_bswap", _, _, _, _) ->
(Ispecific (Ibswap 32), args)
| Cextcall("caml_int64_direct_bswap", _, _, _, _)
| Cextcall("caml_nativeint_direct_bswap", _, _, _, _) ->
(Ispecific (Ibswap 64), args)
(* Recognize sign extension *)
| Casr ->
begin match args with
[Cop(Clsl, [k; Cconst_int (32, _)], _); Cconst_int (32, _)] ->
(Ispecific Isextend32, [k])
| _ -> super#select_operation op args dbg
end
(* Recognize zero extension *)
| Cand ->
begin match args with
| [arg; Cconst_int (0xffff_ffff, _)]
| [arg; Cconst_natint (0xffff_ffffn, _)]
| [Cconst_int (0xffff_ffff, _); arg]
| [Cconst_natint (0xffff_ffffn, _); arg] ->
Ispecific Izextend32, [arg]
| _ -> super#select_operation op args dbg
end
| _ -> super#select_operation op args dbg
(* Recognize float arithmetic with mem *)
method select_floatarith commutative regular_op mem_op args =
match args with
[arg1; Cop(Cload ((Double|Double_u as chunk), _), [loc2], _)] ->
let (addr, arg2) = self#select_addressing chunk loc2 in
(Ispecific(Ifloatarithmem(mem_op, addr)),
[arg1; arg2])
| [Cop(Cload ((Double|Double_u as chunk), _), [loc1], _); arg2]
when commutative ->
let (addr, arg1) = self#select_addressing chunk loc1 in
(Ispecific(Ifloatarithmem(mem_op, addr)),
[arg2; arg1])
| [arg1; arg2] ->
(regular_op, [arg1; arg2])
| _ ->
assert false
method! mark_c_tailcall =
contains_calls := true
(* Deal with register constraints *)
method! insert_op_debug env op dbg rs rd =
try
let (rsrc, rdst) = pseudoregs_for_operation op rs rd in
self#insert_moves env rs rsrc;
self#insert_debug env (Iop op) dbg rsrc rdst;
self#insert_moves env rdst rd;
rd
with Use_default ->
super#insert_op_debug env op dbg rs rd
end
let fundecl f = (new selector)#emit_fundecl f