%% -*- erlang-indent-level: 2 -*- %% %% %CopyrightBegin% %% %% Copyright Ericsson AB 2002-2009. All Rights Reserved. %% %% The contents of this file are subject to the Erlang Public License, %% Version 1.1, (the "License"); you may not use this file except in %% compliance with the License. You should have received a copy of the %% Erlang Public License along with this software. If not, it can be %% retrieved online at http://www.erlang.org/. %% %% Software distributed under the License is distributed on an "AS IS" %% basis, WITHOUT WARRANTY OF ANY KIND, either express or implied. See %% the License for the specific language governing rights and limitations %% under the License. %% %% %CopyrightEnd% %% -module(hipe_sparc_frame). -export([frame/1]). -include("hipe_sparc.hrl"). -include("../rtl/hipe_literals.hrl"). frame(Defun) -> Formals = fix_formals(hipe_sparc:defun_formals(Defun)), Temps0 = all_temps(hipe_sparc:defun_code(Defun), Formals), MinFrame = defun_minframe(Defun), Temps = ensure_minframe(MinFrame, Temps0), ClobbersRA = clobbers_ra(hipe_sparc:defun_code(Defun)), CFG0 = hipe_sparc_cfg:init(Defun), Liveness = hipe_sparc_liveness_all:analyse(CFG0), CFG1 = do_body(CFG0, Liveness, Formals, Temps, ClobbersRA), hipe_sparc_cfg:linearise(CFG1). fix_formals(Formals) -> fix_formals(hipe_sparc_registers:nr_args(), Formals). fix_formals(0, Rest) -> Rest; fix_formals(N, [_|Rest]) -> fix_formals(N-1, Rest); fix_formals(_, []) -> []. do_body(CFG0, Liveness, Formals, Temps, ClobbersRA) -> Context = mk_context(Liveness, Formals, Temps, ClobbersRA), CFG1 = do_blocks(CFG0, Context), do_prologue(CFG1, Context). do_blocks(CFG, Context) -> Labels = hipe_sparc_cfg:labels(CFG), do_blocks(Labels, CFG, Context). do_blocks([Label|Labels], CFG, Context) -> Liveness = context_liveness(Context), LiveOut = hipe_sparc_liveness_all:liveout(Liveness, Label), Block = hipe_sparc_cfg:bb(CFG, Label), Code = hipe_bb:code(Block), NewCode = do_block(Code, LiveOut, Context), NewBlock = hipe_bb:code_update(Block, NewCode), NewCFG = hipe_sparc_cfg:bb_add(CFG, Label, NewBlock), do_blocks(Labels, NewCFG, Context); do_blocks([], CFG, _) -> CFG. do_block(Insns, LiveOut, Context) -> do_block(Insns, LiveOut, Context, context_framesize(Context), []). do_block([I|Insns], LiveOut, Context, FPoff0, RevCode) -> {NewIs, FPoff1} = do_insn(I, LiveOut, Context, FPoff0), do_block(Insns, LiveOut, Context, FPoff1, lists:reverse(NewIs, RevCode)); do_block([], _, Context, FPoff, RevCode) -> FPoff0 = context_framesize(Context), if FPoff =:= FPoff0 -> []; true -> exit({?MODULE,do_block,FPoff}) end, lists:reverse(RevCode, []). do_insn(I, LiveOut, Context, FPoff) -> case I of #pseudo_call{} -> do_pseudo_call(I, LiveOut, Context, FPoff); #pseudo_call_prepare{} -> do_pseudo_call_prepare(I, FPoff); #pseudo_move{} -> {do_pseudo_move(I, Context, FPoff), FPoff}; #pseudo_ret{} -> {do_pseudo_ret(I, Context, FPoff), context_framesize(Context)}; #pseudo_tailcall{} -> {do_pseudo_tailcall(I, Context), context_framesize(Context)}; #pseudo_fmove{} -> {do_pseudo_fmove(I, Context, FPoff), FPoff}; _ -> {[I], FPoff} end. %%% %%% Moves, with Dst or Src possibly a pseudo %%% do_pseudo_move(I, Context, FPoff) -> Dst = hipe_sparc:pseudo_move_dst(I), Src = hipe_sparc:pseudo_move_src(I), case temp_is_pseudo(Dst) of true -> Offset = pseudo_offset(Dst, FPoff, Context), mk_store(Src, hipe_sparc:mk_sp(), Offset, []); _ -> case temp_is_pseudo(Src) of true -> Offset = pseudo_offset(Src, FPoff, Context), mk_load(hipe_sparc:mk_sp(), Offset, Dst, []); _ -> [hipe_sparc:mk_mov(Src, Dst)] end end. do_pseudo_fmove(I, Context, FPoff) -> Dst = hipe_sparc:pseudo_fmove_dst(I), Src = hipe_sparc:pseudo_fmove_src(I), case temp_is_pseudo(Dst) of true -> Offset = pseudo_offset(Dst, FPoff, Context), mk_fstore(Src, hipe_sparc:mk_sp(), Offset); _ -> case temp_is_pseudo(Src) of true -> Offset = pseudo_offset(Src, FPoff, Context), mk_fload(hipe_sparc:mk_sp(), Offset, Dst); _ -> [hipe_sparc:mk_fp_unary('fmovd', Src, Dst)] end end. pseudo_offset(Temp, FPoff, Context) -> FPoff + context_offset(Context, Temp). %%% %%% Return - deallocate frame and emit 'ret $N' insn. %%% do_pseudo_ret(I, Context, FPoff) -> %% XXX: typically only one instruction between %% the move-to-RA and the jmp-via-RA, ouch restore_ra(FPoff, Context, adjust_sp(FPoff + word_size() * context_arity(Context), [I])). restore_ra(FPoff, Context, Rest) -> case context_clobbers_ra(Context) of false -> Rest; true -> RA = hipe_sparc:mk_ra(), mk_load(hipe_sparc:mk_sp(), FPoff - word_size(), RA, Rest) end. adjust_sp(N, Rest) -> if N =:= 0 -> Rest; true -> SP = hipe_sparc:mk_sp(), hipe_sparc:mk_addi(SP, N, SP, Rest) end. %%% %%% Recursive calls. %%% do_pseudo_call_prepare(I, FPoff0) -> %% Create outgoing arguments area on the stack. NrStkArgs = hipe_sparc:pseudo_call_prepare_nrstkargs(I), Offset = NrStkArgs * word_size(), {adjust_sp(-Offset, []), FPoff0 + Offset}. do_pseudo_call(I, LiveOut, Context, FPoff0) -> #sparc_sdesc{exnlab=ExnLab,arity=OrigArity} = hipe_sparc:pseudo_call_sdesc(I), FunV = hipe_sparc:pseudo_call_funv(I), LiveTemps = [Temp || Temp <- LiveOut, temp_is_pseudo(Temp)], SDesc = mk_sdesc(ExnLab, Context, LiveTemps), ContLab = hipe_sparc:pseudo_call_contlab(I), Linkage = hipe_sparc:pseudo_call_linkage(I), CallCode = [hipe_sparc:mk_pseudo_call(FunV, SDesc, ContLab, Linkage)], StkArity = erlang:max(0, OrigArity - hipe_sparc_registers:nr_args()), context_need_stack(Context, stack_need(FPoff0, StkArity, FunV)), ArgsBytes = word_size() * StkArity, {CallCode, FPoff0 - ArgsBytes}. stack_need(FPoff, StkArity, FunV) -> case FunV of #sparc_prim{} -> FPoff; #sparc_mfa{m=M,f=F,a=A} -> case erlang:is_builtin(M, F, A) of true -> FPoff; false -> stack_need_general(FPoff, StkArity) end; _ -> stack_need_general(FPoff, StkArity) end. stack_need_general(FPoff, StkArity) -> erlang:max(FPoff, FPoff + (?SPARC_LEAF_WORDS - StkArity) * word_size()). %%% %%% Create stack descriptors for call sites. %%% mk_sdesc(ExnLab, Context, Temps) -> % for normal calls Temps0 = only_tagged(Temps), Live = mk_live(Context, Temps0), Arity = context_arity(Context), FSize = context_framesize(Context), hipe_sparc:mk_sdesc(ExnLab, (FSize div word_size())-1, Arity, list_to_tuple(Live)). only_tagged(Temps)-> [X || X <- Temps, hipe_sparc:temp_type(X) =:= 'tagged']. mk_live(Context, Temps) -> lists:sort([temp_to_slot(Context, Temp) || Temp <- Temps]). temp_to_slot(Context, Temp) -> (context_framesize(Context) + context_offset(Context, Temp)) div word_size(). mk_minimal_sdesc(Context) -> % for inc_stack_0 calls hipe_sparc:mk_sdesc([], 0, context_arity(Context), {}). %%% %%% Tailcalls. %%% do_pseudo_tailcall(I, Context) -> % always at FPoff=context_framesize(Context) Arity = context_arity(Context), Args = hipe_sparc:pseudo_tailcall_stkargs(I), FunV = hipe_sparc:pseudo_tailcall_funv(I), Linkage = hipe_sparc:pseudo_tailcall_linkage(I), {Insns, FPoff1} = do_tailcall_args(Args, Context), context_need_stack(Context, FPoff1), StkArity = length(Args), FPoff2 = FPoff1 + (Arity - StkArity) * word_size(), context_need_stack(Context, stack_need(FPoff2, StkArity, FunV)), I2 = case FunV of #sparc_temp{} -> hipe_sparc:mk_jmp(FunV, hipe_sparc:mk_simm13(0), []); Fun -> hipe_sparc:mk_call_tail(Fun, Linkage) end, %% XXX: break out the RA restore, just like for pseudo_ret? restore_ra(context_framesize(Context), Context, Insns ++ adjust_sp(FPoff2, [I2])). do_tailcall_args(Args, Context) -> FPoff0 = context_framesize(Context), Arity = context_arity(Context), FrameTop = word_size()*Arity, DangerOff = FrameTop - word_size()*length(Args), %% Moves = mk_moves(Args, FrameTop, []), %% {Stores, Simple, Conflict} = split_moves(Moves, Context, DangerOff, [], [], []), %% sanity check (shouldn't trigger any more) if DangerOff < -FPoff0 -> exit({?MODULE,do_tailcall_args,DangerOff,-FPoff0}); true -> [] end, FPoff1 = FPoff0, %% {Pushes, Pops, FPoff2} = split_conflict(Conflict, FPoff1, [], []), %% TempReg = hipe_sparc_registers:temp1(), %% {adjust_sp(-(FPoff2 - FPoff1), simple_moves(Pushes, FPoff2, TempReg, store_moves(Stores, FPoff2, TempReg, simple_moves(Simple, FPoff2, TempReg, simple_moves(Pops, FPoff2, TempReg, []))))), FPoff2}. mk_moves([Arg|Args], Off, Moves) -> Off1 = Off - word_size(), mk_moves(Args, Off1, [{Arg,Off1}|Moves]); mk_moves([], _, Moves) -> Moves. split_moves([Move|Moves], Context, DangerOff, Stores, Simple, Conflict) -> {Src,DstOff} = Move, case src_is_pseudo(Src) of false -> split_moves(Moves, Context, DangerOff, [Move|Stores], Simple, Conflict); true -> SrcOff = context_offset(Context, Src), Type = typeof_temp(Src), if SrcOff =:= DstOff -> split_moves(Moves, Context, DangerOff, Stores, Simple, Conflict); SrcOff >= DangerOff -> split_moves(Moves, Context, DangerOff, Stores, Simple, [{SrcOff,DstOff,Type}|Conflict]); true -> split_moves(Moves, Context, DangerOff, Stores, [{SrcOff,DstOff,Type}|Simple], Conflict) end end; split_moves([], _, _, Stores, Simple, Conflict) -> {Stores, Simple, Conflict}. split_conflict([{SrcOff,DstOff,Type}|Conflict], FPoff, Pushes, Pops) -> FPoff1 = FPoff + word_size(), Push = {SrcOff,-FPoff1,Type}, Pop = {-FPoff1,DstOff,Type}, split_conflict(Conflict, FPoff1, [Push|Pushes], [Pop|Pops]); split_conflict([], FPoff, Pushes, Pops) -> {lists:reverse(Pushes), Pops, FPoff}. simple_moves([{SrcOff,DstOff,Type}|Moves], FPoff, TempReg, Rest) -> Temp = hipe_sparc:mk_temp(TempReg, Type), SP = hipe_sparc:mk_sp(), LoadOff = FPoff+SrcOff, StoreOff = FPoff+DstOff, simple_moves(Moves, FPoff, TempReg, mk_load(SP, LoadOff, Temp, mk_store(Temp, SP, StoreOff, Rest))); simple_moves([], _, _, Rest) -> Rest. store_moves([{Src,DstOff}|Moves], FPoff, TempReg, Rest) -> %% Type = typeof_temp(Src), SP = hipe_sparc:mk_sp(), StoreOff = FPoff+DstOff, {NewSrc,FixSrc} = case hipe_sparc:is_temp(Src) of true -> {Src, []}; _ -> Temp = hipe_sparc:mk_temp(TempReg, 'untagged'), {Temp, hipe_sparc:mk_set(Src, Temp)} end, store_moves(Moves, FPoff, TempReg, FixSrc ++ mk_store(NewSrc, SP, StoreOff, Rest)); store_moves([], _, _, Rest) -> Rest. %%% %%% Contexts %%% -record(context, {liveness, framesize, arity, map, clobbers_ra, ref_maxstack}). mk_context(Liveness, Formals, Temps, ClobbersRA) -> {Map, MinOff} = mk_temp_map(Formals, ClobbersRA, Temps), FrameSize = (-MinOff), RefMaxStack = hipe_bifs:ref(FrameSize), #context{liveness=Liveness, framesize=FrameSize, arity=length(Formals), map=Map, clobbers_ra=ClobbersRA, ref_maxstack=RefMaxStack}. context_need_stack(#context{ref_maxstack=RM}, N) -> M = hipe_bifs:ref_get(RM), if N > M -> hipe_bifs:ref_set(RM, N); true -> [] end. context_maxstack(#context{ref_maxstack=RM}) -> hipe_bifs:ref_get(RM). context_arity(#context{arity=Arity}) -> Arity. context_framesize(#context{framesize=FrameSize}) -> FrameSize. context_liveness(#context{liveness=Liveness}) -> Liveness. context_offset(#context{map=Map}, Temp) -> tmap_lookup(Map, Temp). context_clobbers_ra(#context{clobbers_ra=ClobbersRA}) -> ClobbersRA. mk_temp_map(Formals, ClobbersRA, Temps) -> {Map, 0} = enter_vars(Formals, word_size() * length(Formals), tmap_empty()), TempsList = tset_to_list(Temps), AllTemps = case ClobbersRA of false -> TempsList; true -> RA = hipe_sparc:mk_new_temp('untagged'), [RA|TempsList] end, enter_vars(AllTemps, 0, Map). enter_vars([V|Vs], PrevOff, Map) -> Off = case hipe_sparc:temp_type(V) of 'double' -> PrevOff - 2*word_size(); % XXX: sparc64: 1*word_size() _ -> PrevOff - word_size() end, enter_vars(Vs, Off, tmap_bind(Map, V, Off)); enter_vars([], Off, Map) -> {Map, Off}. tmap_empty() -> gb_trees:empty(). tmap_bind(Map, Key, Val) -> gb_trees:insert(Key, Val, Map). tmap_lookup(Map, Key) -> gb_trees:get(Key, Map). %%% %%% do_prologue: prepend stack frame allocation code. %%% %%% NewStart: %%% temp1 = *(P + P_SP_LIMIT) %%% temp2 = SP - MaxStack %%% cmp temp2, temp1 %%% if (ltu) goto IncStack else goto AllocFrame %%% AllocFrame: %%% SP = temp2 [if FrameSize == MaxStack] %%% SP -= FrameSize [if FrameSize != MaxStack] %%% *(SP + FrameSize-WordSize) = RA [if ClobbersRA] %%% goto OldStart %%% OldStart: %%% ... %%% IncStack: %%% temp1 = RA %%% call inc_stack; nop %%% RA = temp1 %%% goto NewStart do_prologue(CFG, Context) -> MaxStack = context_maxstack(Context), if MaxStack > 0 -> FrameSize = context_framesize(Context), OldStartLab = hipe_sparc_cfg:start_label(CFG), NewStartLab = hipe_gensym:get_next_label(sparc), %% P = hipe_sparc:mk_temp(hipe_sparc_registers:proc_pointer(), 'untagged'), Temp1 = hipe_sparc:mk_temp1(), SP = hipe_sparc:mk_sp(), %% RA = hipe_sparc:mk_ra(), ClobbersRA = context_clobbers_ra(Context), GotoOldStartCode = [hipe_sparc:mk_b_label(OldStartLab)], AllocFrameCodeTail = case ClobbersRA of false -> GotoOldStartCode; true -> mk_store(RA, SP, FrameSize-word_size(), GotoOldStartCode) end, %% Arity = context_arity(Context), Guaranteed = erlang:max(0, (?SPARC_LEAF_WORDS - Arity) * word_size()), %% {CFG1,NewStartCode} = if MaxStack =< Guaranteed -> %% io:format("~w: MaxStack ~w =< Guaranteed ~w :-)\n", [?MODULE,MaxStack,Guaranteed]), AllocFrameCode = adjust_sp(-FrameSize, AllocFrameCodeTail), NewStartCode0 = AllocFrameCode, % no mflr needed {CFG,NewStartCode0}; true -> %% io:format("~w: MaxStack ~w > Guaranteed ~w :-(\n", [?MODULE,MaxStack,Guaranteed]), AllocFrameLab = hipe_gensym:get_next_label(sparc), IncStackLab = hipe_gensym:get_next_label(sparc), Temp2 = hipe_sparc:mk_temp2(), %% NewStartCodeTail2 = [hipe_sparc:mk_pseudo_bp('lu', IncStackLab, AllocFrameLab, 0.01)], NewStartCodeTail1 = NewStartCodeTail2, % no mflr needed NewStartCode0 = mk_load(P, ?P_NSP_LIMIT, Temp1, hipe_sparc:mk_addi(SP, -MaxStack, Temp2, [hipe_sparc:mk_alu('subcc', Temp2, Temp1, hipe_sparc:mk_g0()) | NewStartCodeTail1])), %% AllocFrameCode = if MaxStack =:= FrameSize -> %% io:format("~w: MaxStack =:= FrameSize =:= ~w :-)\n", [?MODULE,MaxStack]), [hipe_sparc:mk_mov(Temp2, SP) | AllocFrameCodeTail]; true -> %% io:format("~w: MaxStack ~w =/= FrameSize ~w :-(\n", [?MODULE,MaxStack,FrameSize]), adjust_sp(-FrameSize, AllocFrameCodeTail) end, %% IncStackCodeTail = [hipe_sparc:mk_call_rec(hipe_sparc:mk_prim('inc_stack_0'), mk_minimal_sdesc(Context), not_remote), hipe_sparc:mk_mov(Temp1, RA), hipe_sparc:mk_b_label(NewStartLab)], IncStackCode = [hipe_sparc:mk_mov(RA, Temp1) | IncStackCodeTail], % mflr always needed %% CFG0a = hipe_sparc_cfg:bb_add(CFG, AllocFrameLab, hipe_bb:mk_bb(AllocFrameCode)), CFG0b = hipe_sparc_cfg:bb_add(CFG0a, IncStackLab, hipe_bb:mk_bb(IncStackCode)), %% {CFG0b,NewStartCode0} end, %% CFG2 = hipe_sparc_cfg:bb_add(CFG1, NewStartLab, hipe_bb:mk_bb(NewStartCode)), hipe_sparc_cfg:start_label_update(CFG2, NewStartLab); true -> CFG end. %%% Create a load instruction. %%% May clobber Dst early for large offsets. In principle we could %%% clobber TEMP2 if Dst =:= Base, but Dst =/= Base here in frame. mk_load(Base, Offset, Dst, Rest) -> LdOp = 'lduw', % XXX: sparc64: ldx hipe_sparc:mk_load(LdOp, Base, Offset, Dst, 'error', Rest). mk_fload(Base, Offset, Dst) -> hipe_sparc:mk_fload(Base, Offset, Dst, 'temp2'). %%% Create a store instruction. %%% May clobber TEMP2 for large offsets. mk_store(Src, Base, Offset, Rest) -> StOp = 'stw', % XXX: sparc64: stx hipe_sparc:mk_store(StOp, Src, Base, Offset, 'temp2', Rest). mk_fstore(Src, Base, Offset) -> hipe_sparc:mk_fstore(Src, Base, Offset, 'temp2'). %%% typeof_temp -- what's temp's type? typeof_temp(Temp) -> hipe_sparc:temp_type(Temp). %%% Check if an operand is a pseudo-Temp. src_is_pseudo(Src) -> hipe_sparc:is_temp(Src) andalso temp_is_pseudo(Src). temp_is_pseudo(Temp) -> not(hipe_sparc:temp_is_precoloured(Temp)). %%% %%% Detect if a Defun's body clobbers RA. %%% clobbers_ra(Insns) -> case Insns of [#pseudo_call{}|_] -> true; %% moves to RA cannot occur yet [_|Rest] -> clobbers_ra(Rest); [] -> false end. %%% %%% Build the set of all temps used in a Defun's body. %%% all_temps(Code, Formals) -> S0 = find_temps(Code, tset_empty()), S1 = tset_del_list(S0, Formals), tset_filter(S1, fun(T) -> temp_is_pseudo(T) end). find_temps([I|Insns], S0) -> S1 = tset_add_list(S0, hipe_sparc_defuse:insn_def_all(I)), S2 = tset_add_list(S1, hipe_sparc_defuse:insn_use_all(I)), find_temps(Insns, S2); find_temps([], S) -> S. tset_empty() -> gb_sets:new(). tset_size(S) -> gb_sets:size(S). tset_insert(S, T) -> gb_sets:add_element(T, S). tset_add_list(S, Ts) -> gb_sets:union(S, gb_sets:from_list(Ts)). tset_del_list(S, Ts) -> gb_sets:subtract(S, gb_sets:from_list(Ts)). tset_filter(S, F) -> gb_sets:filter(F, S). tset_to_list(S) -> gb_sets:to_list(S). %%% %%% Compute minimum permissible frame size, ignoring spilled temps. %%% This is done to ensure that we won't have to adjust the frame size %%% in the middle of a tailcall. %%% defun_minframe(Defun) -> MaxTailArity = body_mta(hipe_sparc:defun_code(Defun), 0), MyArity = length(fix_formals(hipe_sparc:defun_formals(Defun))), erlang:max(MaxTailArity - MyArity, 0). body_mta([I|Code], MTA) -> body_mta(Code, insn_mta(I, MTA)); body_mta([], MTA) -> MTA. insn_mta(I, MTA) -> case I of #pseudo_tailcall{arity=Arity} -> erlang:max(MTA, Arity - hipe_sparc_registers:nr_args()); _ -> MTA end. %%% %%% Ensure that we have enough temps to satisfy the minimum frame size, %%% if necessary by prepending unused dummy temps. %%% ensure_minframe(MinFrame, Temps) -> ensure_minframe(MinFrame, tset_size(Temps), Temps). ensure_minframe(MinFrame, Frame, Temps) -> if MinFrame > Frame -> Temp = hipe_sparc:mk_new_temp('untagged'), ensure_minframe(MinFrame, Frame+1, tset_insert(Temps, Temp)); true -> Temps end. word_size() -> hipe_rtl_arch:word_size().