%%
%% %CopyrightBegin%
%%
%% Copyright Ericsson AB 2004-2016. All Rights Reserved.
%%
%% Licensed under the Apache License, Version 2.0 (the "License");
%% you may not use this file except in compliance with the License.
%% You may obtain a copy of the License at
%%
%%     http://www.apache.org/licenses/LICENSE-2.0
%%
%% Unless required by applicable law or agreed to in writing, software
%% distributed under the License is distributed on an "AS IS" BASIS,
%% WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
%% See the License for the specific language governing permissions and
%% limitations under the License.
%%
%% %CopyrightEnd%
%%
%% Purpose: Optimizes booleans in guards.

-module(beam_bool).

-export([module/2]).

-import(lists, [reverse/1,reverse/2,foldl/3,mapfoldl/3,map/2]).

-record(st,
        {next,                                  %Next label number.
         ll                                     %Live regs at labels.
        }).

%% module(Code, Options) -> {ok,Code}
%%  Entry point of the pass. Each function in the module is run
%%  through function/2. The number to use for the next new label
%%  is threaded from one function to the next, starting at 100000000.

module({Mod,Exp,Attr,Funcs0,Lc}, _Opts) ->
    FirstLabel = 100000000,
    {Funcs,_NextLabel} = mapfoldl(fun function/2, FirstLabel, Funcs0),
    {ok,{Mod,Exp,Attr,Funcs,Lc}}.

%% function(Function, NextLabel) -> {Function,NextLabel}
%%  Optimize the instructions of one function. If anything goes wrong,
%%  the name of the function is printed before the original exception
%%  is re-raised with its original stack trace.

function({function,Name,Arity,CLabel,Code0}, FirstLabel) ->
    try
        {Code,#st{next=NextLabel}} = bool_opt(Code0, FirstLabel),
        {{function,Name,Arity,CLabel,Code},NextLabel}
    catch
        Class:Reason ->
            %% The stack trace must be fetched before any other call
            %% is made in this handler.
            Stack = erlang:get_stacktrace(),
            io:fwrite("Function: ~w/~w\n", [Name,Arity]),
            erlang:raise(Class, Reason, Stack)
    end.

%%
%% Optimize boolean expressions that use guard bifs. Rewrite to
%% use test instructions if possible.
%%

bool_opt(Asm, FirstLabel) ->
    St = #st{next=FirstLabel,ll=beam_utils:index_labels(Asm)},
    bopt(Asm, [], St).
%% bopt([Instruction], ReversedAcc, State) -> {[Instruction],State}
%%  Walk the instruction sequence, accumulating the (possibly rewritten)
%%  instructions in reverse order.
%%
%%  The first clause recognizes a block followed by the sequence
%%
%%      jump Succ / label Fail / block [move false -> Dst] / label Succ
%%
%%  If split_block/5 succeeds, the sequence is replaced in the
%%  accumulator by a single {protected,[Dst],Block,{Fail,Succ}}
%%  pseudo-instruction, preceded by any instructions of the block that
%%  come before the guard BIFs.
%%
%%  The second clause recognizes a test of a register against the atom
%%  'true' when the most recently accumulated instruction is a block,
%%  and lets bopt_block/5 attempt the actual rewrite.
%%
%%  At the end, bopt_reverse/2 restores the instruction order and
%%  expands any 'protected' pseudo-instructions left in the accumulator.

bopt([{block,Bl0}=Block|
      [{jump,{f,Succ}},
       {label,Fail},
       {block,[{set,[Dst],[{atom,false}],move}]},
       {label,Succ}|Is]=Is0], Acc0, St) ->
    case split_block(Bl0, Dst, Fail, Acc0, true) of
        failed ->
            bopt(Is0, [Block|Acc0], St);
        {Bl,PreBlock} ->
            Acc1 = case PreBlock of
                       [] -> Acc0;
                       _ -> [{block,PreBlock}|Acc0]
                   end,
            Acc = [{protected,[Dst],Bl,{Fail,Succ}}|Acc1],
            bopt(Is, Acc, St)
    end;
bopt([{test,is_eq_exact,{f,Fail},[Reg,{atom,true}]}=I|Is], [{block,_}|_]=Acc0, St0) ->
    case bopt_block(Reg, Fail, Is, Acc0, St0) of
        failed -> bopt(Is, [I|Acc0], St0);
        {Acc,St} -> bopt(Is, Acc, St)
    end;
bopt([I|Is], Acc, St) ->
    bopt(Is, [I|Acc], St);
bopt([], Acc, St) ->
    {bopt_reverse(Acc, []),St}.

%% bopt_reverse(ReversedInstructions, Acc) -> [Instruction]
%%  Reverse the accumulated instructions. Each remaining
%%  {protected,[Dst],Block,{Fail,Succ}} pseudo-instruction is expanded
%%  back into the five-instruction sequence that bopt/3 matched.

bopt_reverse([{protected,[Dst],Block,{Fail,Succ}}|Is], Acc0) ->
    Acc = [{block,Block},{jump,{f,Succ}},
           {label,Fail},
           {block,[{set,[Dst],[{atom,false}],move}]},
           {label,Succ}|Acc0],
    bopt_reverse(Is, Acc);
bopt_reverse([I|Is], Acc) ->
    bopt_reverse(Is, [I|Acc]);
bopt_reverse([], Acc) -> Acc.

%% bopt_block(Reg, Fail, OldIs, Accumulator, St) -> failed | {NewAcc,St}
%%  Attempt to optimize a block of guard BIFs followed by a test
%%  instruction.
%%
%%  Reg is the register compared to 'true' by the test instruction,
%%  Fail is the failure label of the test, OldIs are the instructions
%%  following the test, and Accumulator is the reversed list of
%%  preceding instructions (its head is the block to optimize).

bopt_block(Reg, Fail, OldIs, [{block,Bl0}|Acc0], St0) ->
    case split_block(Bl0, Reg, Fail, Acc0, false) of
        failed ->
            %% Reason for failure: The block either contained no
            %% guard BIFs with the failure label Fail, or the final
            %% instruction in the block did not assign the Reg register.
            failed;
        {Bl1,BlPre} ->
            %% The block has been split. Bl1 is a non-empty list
            %% of guard BIF instructions having the failure label Fail.
            %% BlPre is a (possibly empty) list of instructions preceding
            %% Bl1.
            Acc1 = make_block(BlPre, Acc0),
            {Bl,Acc} = extend_block(Bl1, Fail, Acc1),
            try
                {NewCode,St} = bopt_tree_cg(Bl, Fail, St0),
                ensure_opt_safe(Bl, NewCode, OldIs, Fail, Acc, St),
                {NewCode++Acc,St}
            catch
                %% Not possible to rewrite because a boolean value is
                %% passed to another guard bif, e.g. 'abs(A > B)'
                %% (in this case, obviously nonsense code). Rare in
                %% practice.
                throw:mixed ->
                    failed;

                %% There was a reference to a boolean expression
                %% from inside a protected block (try/catch), to
                %% a boolean expression outside.
                throw:protected_barrier ->
                    failed;

                %% The 'xor' operator was used. We currently don't
                %% find it worthwhile to translate 'xor' operators
                %% (the code would be clumsy).
                throw:'xor' ->
                    failed;

                %% The block does not contain a boolean expression,
                %% but only a call to a guard BIF.
                %% For instance: ... when element(1, T) ->
                throw:not_boolean_expr ->
                    failed;

                %% The optimization is not safe. (A register
                %% used by the instructions following the
                %% optimized code is either not assigned a
                %% value at all or assigned a different value.)
                throw:all_registers_not_killed ->
                    failed;
                throw:registers_used ->
                    failed;

                %% A protected block referred to the value
                %% returned by another protected block,
                %% probably because the Core Erlang code
                %% used nested try/catches in the guard.
                %% (v3_core never produces nested try/catches
                %% in guards, so it must have been another
                %% Core Erlang translator.)
                throw:protected_violation ->
                    failed;

                %% Failed to work out the live registers for a GC
                %% BIF. For example, if the number of live registers
                %% needed to be 4 because {x,3} was a source register,
                %% but {x,2} was not known to be initialized, this
                %% exception would be thrown.
                throw:gc_bif_alloc_failure ->
                    failed
            end
    end.

%% ensure_opt_safe(OriginalCode, OptCode, FollowingCode, Fail,
%%             ReversedPrecedingCode, State) -> ok
%%  Comparing the original code to the optimized code, determine
%%  whether the optimized code is guaranteed to work in the same
%%  way as the original code.
%%
%%  Throw an exception if the optimization is not safe
%%  (all_registers_not_killed or registers_used).
%%
ensure_opt_safe(Bl, NewCode, OldIs, Fail, PrecedingCode, St) ->
    %% Here are the conditions that must be true for the
    %% optimization to be safe.
    %%
    %% 1. If a register is INITIALIZED by PrecedingCode,
    %%    then if that register is assigned a value in the original
    %%    code, but not in the optimized code, it must be UNUSED or KILLED
    %%    in the code that follows.
    %%
    %% 2. If a register is not known to be INITIALIZED by PrecedingCode,
    %%    then if that register is assigned a value in the original
    %%    code, but not in the optimized code, it must be KILLED
    %%    by the code that follows.
    %%
    %% 3. Any register that is assigned a value in the optimized
    %%    code must be UNUSED or KILLED in the following code,
    %%    unless we can be sure that it is always assigned the same
    %%    value.

    InitInPreceding = initialized_regs(PrecedingCode),

    PrevDst = dst_regs(Bl),
    NewDst = dst_regs(NewCode),
    %% Registers assigned by the original code only.
    NotSet = ordsets:subtract(PrevDst, NewDst),
    %% Condition 2: not assigned any longer and not known to be
    %% initialized beforehand.
    MustBeKilled = ordsets:subtract(NotSet, InitInPreceding),

    case all_killed(MustBeKilled, OldIs, Fail, St) of
        false -> throw(all_registers_not_killed);
        true -> ok
    end,
    %% Conditions 1 and 3: everything else that either code
    %% version assigns.
    MustBeUnused = ordsets:subtract(ordsets:union(NotSet, NewDst),
                                    MustBeKilled),
    case none_used(MustBeUnused, OldIs, Fail, St) of
        false -> throw(registers_used);
        true -> ok
    end,
    ok.

%% update_fail_label([Instruction], Fail, Acc) -> [Instruction]
%%  Replace the failure label of every BIF and GC BIF instruction
%%  with Fail. Only those two kinds of 'set' instructions are accepted;
%%  anything else causes a function_clause error.

update_fail_label([{set,Ds,As,{bif,N,{f,_}}}|Is], Fail, Acc) ->
    update_fail_label(Is, Fail, [{set,Ds,As,{bif,N,{f,Fail}}}|Acc]);
update_fail_label([{set,Ds,As,{alloc,Regs,{gc_bif,N,{f,_}}}}|Is], Fail, Acc) ->
    update_fail_label(Is, Fail,
                      [{set,Ds,As,{alloc,Regs,{gc_bif,N,{f,Fail}}}}|Acc]);
update_fail_label([], _, Acc) -> reverse(Acc).

%% make_block([Instruction]) -> [{block,[Instruction]}] | []
%% make_block([Instruction], Acc) -> [{block,[Instruction]}|Acc] | Acc
%%  Wrap the instructions in a block and put the block in front of
%%  Acc. An empty list of instructions produces no block at all.

make_block(Bl) ->
    make_block(Bl, []).

make_block([], Acc) -> Acc;
make_block(Bl, Acc) -> [{block,Bl}|Acc].

%% extend_block(BlockAcc, Fail, ReversedPrecedingCode) ->
%%                                   {BlockAcc,ReversedPrecedingCode}
%%  Extend the block to be optimized backwards into the preceding
%%  code. 'protected' pseudo-instructions are moved into the block
%%  as they are. From a preceding block, the trailing instructions
%%  accepted by extend_block_1/3 are moved; if the entire block was
%%  moved, the search continues with the code before it.

extend_block(BlAcc, Fail, [{protected,_,_,_}=Prot|OldAcc]) ->
    extend_block([Prot|BlAcc], Fail, OldAcc);
extend_block(BlAcc0, Fail, [{block,Is0}|OldAcc]) ->
    case extend_block_1(reverse(Is0), Fail, BlAcc0) of
        {BlAcc,[]} -> extend_block(BlAcc, Fail, OldAcc);
        {BlAcc,Is} -> {BlAcc,[{block,Is}|OldAcc]}
    end;
extend_block(BlAcc, _, OldAcc) -> {BlAcc,OldAcc}.
%% extend_block_1(ReversedInstructions, Fail, BlockAcc) ->
%%                                   {BlockAcc,RemainingInstructions}
%%  Move instructions from the end of a block (given in reverse order)
%%  to the front of BlockAcc for as long as they are BIF instructions
%%  that assign an x register and either have the failure label Fail
%%  or are type tests/comparisons. The instructions that were not moved
%%  are returned in their original order.

extend_block_1([{set,[{x,_}],_,{bif,_,{f,Fail}}}=Instr|Rest], Fail, Acc) ->
    extend_block_1(Rest, Fail, [Instr|Acc]);
extend_block_1([{set,[{x,_}],Args,{bif,Name,_}}=Instr|Rest]=RevIs, Fail, Acc) ->
    case safe_bool_op(Name, length(Args)) of
        true -> extend_block_1(Rest, Fail, [Instr|Acc]);
        false -> {Acc,reverse(RevIs)}
    end;
extend_block_1([], _Fail, Acc) ->
    {Acc,[]};
extend_block_1([_|_]=RevIs, _Fail, Acc) ->
    {Acc,reverse(RevIs)}.

%% split_block([Instruction], Destination, FailLabel, [PreInstruction],
%%             ProhibitFailLabelInPreBlock) -> failed | {Block,PreBlock}
%%  Split a sequence of instructions into two blocks - one containing
%%  all guard bif instructions and a pre-block with all instructions
%%  before the guard BIFs.

split_block(Is, Dst, Fail, PreIs, ProhibitFailLabel) ->
    case ProhibitFailLabel andalso beam_jump:is_label_used_in(Fail, PreIs) of
        true ->
            %% The failure label was used in one of the instructions (most
            %% probably bit syntax construction) preceding the block,
            %% the caller might eliminate the label.
            failed;
        false ->
            split_block_rev(reverse(Is), Dst, Fail, ProhibitFailLabel)
    end.

%% The last instruction of the block (first in the reversed list)
%% must assign the destination register.

split_block_rev([{set,[Dst],_,_}|_]=RevIs, Dst, Fail, ProhibitFailLabel) ->
    split_block_1(RevIs, Fail, ProhibitFailLabel);
split_block_rev(_RevIs, _Dst, _Fail, _ProhibitFailLabel) ->
    failed.

split_block_1(RevIs, Fail, ProhibitFailLabel) ->
    case split_block_2(RevIs, Fail, []) of
        {[],_PreBlock} ->
            %% No guard BIFs with the failure label at all.
            failed;
        {_Block,PreBlock}=Split ->
            LabelUsed = ProhibitFailLabel andalso
                split_block_label_used(PreBlock, Fail),
            case LabelUsed of
                true ->
                    %% The failure label was used in the pre-block;
                    %% not allowed, because the label may be removed.
                    failed;
                false ->
                    Split
            end
    end.

%% split_block_2(ReversedInstructions, Fail, Acc) -> {Block,PreBlock}
%%  Collect the BIF and GC BIF instructions at the end of the block
%%  that have the failure label Fail. Both returned lists are in
%%  execution order.

split_block_2([{set,[_],_,{bif,_,{f,Fail}}}=Instr|Rest], Fail, Acc) ->
    split_block_2(Rest, Fail, [Instr|Acc]);
split_block_2([{set,[_],_,{alloc,_,{gc_bif,_,{f,Fail}}}}=Instr|Rest], Fail, Acc) ->
    split_block_2(Rest, Fail, [Instr|Acc]);
split_block_2(RevPre, _Fail, Acc) ->
    {Acc,reverse(RevPre)}.
%% split_block_label_used([Instruction], Fail) -> true|false
%%  Test whether any BIF, GC BIF or put_map instruction in the
%%  list has Fail as its failure label.

split_block_label_used(Is, Fail) ->
    lists:any(fun({set,[_],_,{bif,_,{f,Lbl}}}) ->
                      Lbl =:= Fail;
                 ({set,[_],_,{alloc,_,{gc_bif,_,{f,Lbl}}}}) ->
                      Lbl =:= Fail;
                 ({set,[_],_,{alloc,_,{put_map,_,{f,Lbl}}}}) ->
                      Lbl =:= Fail;
                 (_) ->
                      false
              end, Is).

%% dst_regs([Instruction]) -> ordsets(Register)
%%  Return the destination registers of all BIF and GC BIF instructions
%%  in the list, including those nested inside 'block' and 'protected'.

dst_regs(Is) ->
    ordsets:from_list(dst_regs_list(Is)).

dst_regs_list(Is) ->
    lists:flatmap(fun dst_regs_instr/1, Is).

dst_regs_instr({block,Bl}) -> dst_regs_list(Bl);
dst_regs_instr({set,[D],_,{bif,_,{f,_}}}) -> [D];
dst_regs_instr({set,[D],_,{alloc,_,{gc_bif,_,{f,_}}}}) -> [D];
dst_regs_instr({protected,_,Bl,_}) -> dst_regs_list(Bl);
dst_regs_instr(_) -> [].

%% all_killed([Register], FollowingCode, Fail, State) -> true|false
%%  Test whether every register is killed according to is_killed/4.

all_killed(Regs, OldIs, Fail, St) ->
    lists:all(fun(R) -> is_killed(R, OldIs, Fail, St) end, Regs).

%% none_used([Register], FollowingCode, Fail, State) -> true|false
%%  Test whether every register is unused according to is_not_used/4.

none_used(Regs, OldIs, Fail, St) ->
    lists:all(fun(R) -> is_not_used(R, OldIs, Fail, St) end, Regs).

%% bopt_tree_cg(Block, Fail, State) -> {ReversedCode,State}
%%  Build a boolean tree from the block and generate test instructions
%%  from it. Throws not_boolean_expr unless the block boils down to
%%  exactly one boolean tree; the functions called may throw other
%%  reasons (see the catch clauses in bopt_block/5).

bopt_tree_cg(Block0, Fail, St) ->
    Free = free_variables(Block0),
    Block = ssa_block(Block0),
    bopt_tree_cg_1(bopt_tree(Block, Free, []), Free, Fail, St).

bopt_tree_cg_1({Pre0,[{_,Tree}]}, Free, Fail, St) ->
    Pre1 = update_fail_label(Pre0, Fail, []),
    {Pre,Regs} = rename_regs(Pre1, init_regs(gb_trees:keys(Free))),
    bopt_cg(Tree, Fail, Regs, make_block(Pre), St);
bopt_tree_cg_1(_Other, _Free, _Fail, _St) ->
    throw(not_boolean_expr).
%% bopt_tree([Instruction], Forest, Pre) -> {Pre,[{Register,Tree}]}
%%  Translate the instructions to boolean trees. Forest is a gb_tree
%%  mapping each register either to 'any' (a value that is not a
%%  boolean tree) or to the tree that computes it. A tree is removed
%%  from the forest when a boolean operator consumes it. BIFs that
%%  cannot be turned into tests are collected in Pre. The result
%%  holds Pre in execution order and the trees left in the forest.

bopt_tree([{set,[Dst],Args0,{bif,'not',_}}|Is], Forest0, Pre) ->
    {[Arg],Forest} = bopt_bool_args(Args0, Forest0),
    bopt_tree(Is, gb_trees:enter(Dst, {'not',Arg}, Forest), Pre);
bopt_tree([{set,[Dst],Args0,{bif,Op,_}}|Is], Forest0, Pre)
  when Op =:= 'and'; Op =:= 'or' ->
    {Args,Forest} = bopt_bool_args(Args0, Forest0),
    Node = bopt_tree_node(Op, Args),
    bopt_tree(Is, gb_trees:enter(Dst, Node, Forest), Pre);
bopt_tree([{set,_,_,{bif,'xor',_}}|_], _, _) ->
    throw('xor');
bopt_tree([{protected,[Dst],Code,_}|Is], Forest0, Pre) ->
    %% Only the plain values are visible inside the protected block.
    Plain = lists:filter(fun({_,any}) -> true;
                            (_) -> false
                         end, gb_trees:to_list(Forest0)),
    case bopt_tree(Code, gb_trees:from_orddict(Plain), []) of
        {ProtPre,[{_,ProtTree}]} ->
            Forest = gb_trees:enter(Dst, {prot,ProtPre,ProtTree}, Forest0),
            bopt_tree(Is, Forest, Pre);
        _Other ->
            throw(not_boolean_expr)
    end;
bopt_tree([{set,[Dst],Args,{bif,Name,_}}=Bif|Is], Forest0, Pre) ->
    IsTest = safe_bool_op(Name, length(Args)),
    bopt_good_args(Args, Forest0),
    case IsTest of
        true ->
            Test = bif_to_test(Dst, Name, Args),
            bopt_tree(Is, gb_trees:enter(Dst, Test, Forest0), Pre);
        false ->
            bopt_tree(Is, gb_trees:enter(Dst, any, Forest0), [Bif|Pre])
    end;
bopt_tree([{set,[Dst],Args,{alloc,_,{gc_bif,_,_}}}=Bif|Is], Forest0, Pre) ->
    bopt_good_args(Args, Forest0),
    bopt_tree(Is, gb_trees:enter(Dst, any, Forest0), [Bif|Pre]);
bopt_tree([], Forest, Pre) ->
    Trees = lists:filter(fun({_,V}) -> V =/= any end,
                         gb_trees:to_list(Forest)),
    {reverse(Pre),Trees}.

bopt_tree_node('and', Args) -> make_and_node(Args);
bopt_tree_node('or', Args) -> make_or_node(Args).

%% safe_bool_op(Name, Arity) -> true|false
%%  Test whether the BIF is a type test or a comparison operator.

safe_bool_op(Name, Arity) ->
    erl_internal:new_type_test(Name, Arity) orelse
        erl_internal:comp_op(Name, Arity).

%% bopt_bool_args([Arg], Forest) -> {[Node],Forest}
%%  Look up the arguments of a boolean operator. If both arguments
%%  are the same term, the lookup is done once only, since
%%  bopt_bool_arg/2 deletes the register from the forest.

bopt_bool_args([Same,Same], Forest0) ->
    {Node,Forest} = bopt_bool_arg(Same, Forest0),
    {[Node,Node],Forest};
bopt_bool_args(Args, Forest) ->
    mapfoldl(fun bopt_bool_arg/2, Forest, Args).
%% bopt_bool_arg(Arg, Forest) -> {Node,Forest}
%%  Translate one argument of a boolean operator. A register is
%%  replaced by its tree (or, for a plain value, by a test against
%%  the atom 'true') and deleted from the forest. Throws 'mixed'
%%  if the register is not in the forest. Any other term is returned
%%  as it is.

bopt_bool_arg({Tag,_}=Reg, Forest) when Tag =:= x; Tag =:= y; Tag =:= tmp ->
    Node = bool_arg_node(Reg, gb_trees:lookup(Reg, Forest)),
    {Node,gb_trees:delete(Reg, Forest)};
bopt_bool_arg(Term, Forest) ->
    {Term,Forest}.

bool_arg_node(Reg, {value,any}) -> {test,is_eq_exact,fail,[Reg,{atom,true}]};
bool_arg_node(_Reg, {value,Node}) -> Node;
bool_arg_node(_Reg, none) -> throw(mixed).

%% bopt_good_args([Arg], Forest) -> ok
%%  Verify that no argument of a non-boolean BIF is the result of
%%  a boolean tree. Throws 'mixed' or 'protected_barrier' otherwise.

bopt_good_args(Args, Forest) ->
    lists:foreach(fun(Arg) -> bopt_good_arg(Arg, Forest) end, Args).

bopt_good_arg({Tag,_}=Reg, Forest) when Tag =:= x; Tag =:= tmp ->
    good_arg(gb_trees:lookup(Reg, Forest));
bopt_good_arg(_, _) ->
    ok.

good_arg({value,any}) -> ok;
good_arg({value,_}) -> throw(mixed);
good_arg(none) -> throw(protected_barrier).

bif_to_test(_, Name, Args) ->
    beam_utils:bif_to_test(Name, Args, fail).

%% make_and_node([Node]) -> Node
%%  Build a node for a conjunction. Nested 'and' nodes are flattened,
%%  'true' operands are dropped, and everything following a 'false'
%%  operand is discarded.

make_and_node(Nodes) ->
    and_node(simplify_and_list(make_and_list(Nodes))).

and_node([]) -> {atom,true};
and_node([Node]) -> Node;
and_node(Nodes) -> {'and',Nodes}.

make_and_list(Nodes) ->
    lists:flatmap(fun({'and',Inner}) -> make_and_list(Inner);
                     (Node) -> [Node]
                  end, Nodes).

simplify_and_list(Nodes) ->
    IsNot = fun(Atom) -> fun(Node) -> Node =/= {atom,Atom} end end,
    case lists:splitwith(IsNot(false), Nodes) of
        {Before,[]} ->
            lists:filter(IsNot(true), Before);
        {Before,[False|_]} ->
            lists:filter(IsNot(true), Before) ++ [False]
    end.

%% make_or_node([Node]) -> Node
%%  Build a node for a disjunction. Nested 'or' nodes are flattened,
%%  'false' operands are dropped, and everything following a 'true'
%%  operand is discarded.

make_or_node(Nodes) ->
    or_node(simplify_or_list(make_or_list(Nodes))).

or_node([]) -> {atom,false};
or_node([Node]) -> Node;
or_node(Nodes) -> {'or',Nodes}.

make_or_list(Nodes) ->
    lists:flatmap(fun({'or',Inner}) -> make_or_list(Inner);
                     (Node) -> [Node]
                  end, Nodes).

simplify_or_list(Nodes) ->
    IsNot = fun(Atom) -> fun(Node) -> Node =/= {atom,Atom} end end,
    case lists:splitwith(IsNot(true), Nodes) of
        {Before,[]} ->
            lists:filter(IsNot(false), Before);
        {Before,[True|_]} ->
            lists:filter(IsNot(false), Before) ++ [True]
    end.

%% Code generation for a boolean tree.
%% bopt_cg(Tree, Fail, Regs, Acc, State) -> {Acc,State}
%%  Generate code for a boolean tree. The instructions are added to
%%  the front of Acc, that is, Acc is built in reverse order. Control
%%  is transferred to the label Fail if the tree evaluates to false.
%%  Throws not_boolean_expr for anything that is not a boolean tree.

bopt_cg({'not',Arg}, Fail, Rs, Acc, St) ->
    bopt_cg(bopt_cg_not(Arg), Fail, Rs, Acc, St);
bopt_cg({'and',Nodes}, Fail, Rs, Acc, St) ->
    bopt_cg_and(Nodes, Fail, Rs, Acc, St);
bopt_cg({'or',Nodes}, Fail, Rs, Acc, St0) ->
    {Succ,St} = new_label(St0),
    bopt_cg_or(Nodes, Succ, Fail, Rs, Acc, St);
bopt_cg({test,Name,fail,Args0}, Fail, Rs, Acc, St) ->
    Args = rename_sources(Args0, Rs),
    {[{test,Name,{f,Fail},Args}|Acc],St};
bopt_cg({inverted_test,Name,fail,Args0}, Fail, Rs, Acc, St0) ->
    Args = rename_sources(Args0, Rs),
    {Skip,St} = new_label(St0),
    %% In execution order: the test jumps past the jump to Fail
    %% when it fails; otherwise the jump to Fail is taken.
    Code = [{label,Skip},
            {jump,{f,Fail}},
            {test,Name,{f,Skip},Args}],
    {Code ++ Acc,St};
bopt_cg({prot,Pre0,Tree}, Fail, Rs0, Acc, St) ->
    Pre1 = update_fail_label(Pre0, Fail, []),
    {Pre,Rs} = rename_regs(Pre1, Rs0),
    bopt_cg(Tree, Fail, Rs, make_block(Pre, Acc), St);
bopt_cg({atom,true}, _Fail, _Rs, Acc, St) ->
    {Acc,St};
bopt_cg({atom,false}, Fail, _Rs, Acc, St) ->
    {[{jump,{f,Fail}}|Acc],St};
bopt_cg(_, _, _, _, _) ->
    throw(not_boolean_expr).

%% bopt_cg_not(Tree) -> Tree
%%  Negate a tree by pushing the negation down to the leaves.

bopt_cg_not({'and',Nodes}) ->
    {'or',map(fun bopt_cg_not/1, Nodes)};
bopt_cg_not({'or',Nodes}) ->
    {'and',map(fun bopt_cg_not/1, Nodes)};
bopt_cg_not({'not',Arg}) ->
    bopt_cg_not_not(Arg);
bopt_cg_not({test,Name,Fail,Args}) ->
    {inverted_test,Name,Fail,Args};
bopt_cg_not({atom,Bool}) when is_boolean(Bool) ->
    {atom,not Bool};
bopt_cg_not(_) ->
    throw(not_boolean_expr).

%% bopt_cg_not_not(Tree) -> Tree
%%  Handle a tree inside a double negation: 'and'/'or' nodes are kept
%%  while nested 'not' nodes are resolved; leaves are returned as is.

bopt_cg_not_not({'and',Nodes}) ->
    {'and',map(fun bopt_cg_not_not/1, Nodes)};
bopt_cg_not_not({'or',Nodes}) ->
    {'or',map(fun bopt_cg_not_not/1, Nodes)};
bopt_cg_not_not({'not',Arg}) ->
    bopt_cg_not(Arg);
bopt_cg_not_not(Leaf) ->
    Leaf.

%% bopt_cg_and([Tree], Fail, Regs, Acc, State) -> {Acc,State}
%%  Generate code for each operand in turn; every operand
%%  branches to Fail when false.

bopt_cg_and(Nodes, Fail, Rs, Acc0, St0) ->
    foldl(fun(Node, {Acc,St}) ->
                  bopt_cg(Node, Fail, Rs, Acc, St)
          end, {Acc0,St0}, Nodes).
%% bopt_cg_or([Tree], Succ, Fail, Regs, Acc, State) -> {Acc,State}
%%  Generate code for a disjunction. Each operand but the last fails
%%  to a fresh label placed just before the next operand and is
%%  followed by a jump to Succ. The last operand fails to Fail, and
%%  the label Succ is placed after it.

bopt_cg_or([Last], Succ, Fail, Rs, Acc0, St0) ->
    {Acc,St} = bopt_cg(Last, Fail, Rs, Acc0, St0),
    {[{label,Succ}|Acc],St};
bopt_cg_or([Node|Nodes], Succ, Fail, Rs, Acc0, St0) ->
    {Next,St1} = new_label(St0),
    {Acc1,St} = bopt_cg(Node, Next, Rs, Acc0, St1),
    Acc = [{label,Next},{jump,{f,Succ}}|Acc1],
    bopt_cg_or(Nodes, Succ, Fail, Rs, Acc, St).

%% new_label(State) -> {Label,State}
%%  Allocate a new label number.

new_label(#st{next=Label}=St) when is_integer(Label) ->
    {Label,St#st{next=Label+1}}.

%% free_variables([Instruction]) -> gb_tree(Register -> any)
%%  Return the registers that may be used by the block without having
%%  been assigned inside it, as the initial forest for bopt_tree/3.

free_variables(Is) ->
    Empty = gb_sets:empty(),
    free_vars_1(Is, Empty, Empty, Empty).

%% free_vars_1(Instructions, Free, New, Alive) -> gb_tree()
%%  Free: registers read before being assigned in the block.
%%  New: registers assigned in the block.
%%  Alive: registers named by the live count of any GC BIF.

free_vars_1([{set,Ds,As,{bif,_,_}}|Is], F0, N0, A) ->
    {F,N} = free_vars_set(Ds, As, F0, N0),
    free_vars_1(Is, F, N, A);
free_vars_1([{set,Ds,As,{alloc,Live,{gc_bif,_,_}}}|Is], F0, N0, A0) ->
    A = gb_sets:union(A0, gb_sets:from_list(free_vars_regs(Live))),
    {F,N} = free_vars_set(Ds, As, F0, N0),
    free_vars_1(Is, F, N, A);
free_vars_1([{protected,_,Pa,_}|Is], F, N, A) ->
    free_vars_1(Pa++Is, F, N, A);
free_vars_1([], F, N, A) ->
    Regs = free_vars_list(gb_sets:is_empty(A), F, N, A),
    gb_trees:from_orddict([{Reg,any} || Reg <- Regs]).

free_vars_set(Ds, As, F0, N0) ->
    F = gb_sets:union(F0, gb_sets:difference(var_list(As), N0)),
    N = gb_sets:union(N0, var_list(Ds)),
    {F,N}.

free_vars_list(true, F, N, _A) ->
    %% No GC BIFs. Include every x register below the lowest
    %% register assigned in the block.
    {x,X} = gb_sets:smallest(N),
    Below = ordsets:from_list(free_vars_regs(X)),
    ordsets:union(gb_sets:to_list(F), Below);
free_vars_list(false, F, N, A) ->
    %% At least one GC BIF.
    gb_sets:to_list(gb_sets:union(F, gb_sets:difference(A, N))).

%% var_list([Operand]) -> gb_set(Register)
%%  Return the x and y registers found among the operands.

var_list(Operands) ->
    foldl(fun({Tag,_}=Reg, Set) when Tag =:= x; Tag =:= y ->
                  gb_sets:add(Reg, Set);
             (_, Set) ->
                  Set
          end, gb_sets:empty(), Operands).

%% free_vars_regs(N) -> [{x,N-1},...,{x,0}]

free_vars_regs(0) -> [];
free_vars_regs(N) -> [{x,N-1}|free_vars_regs(N-1)].

%% rename_regs([Instruction], Regs) -> {[Instruction],Regs}
%%  Rename the registers in the instructions according to Regs.

rename_regs(Is, Regs) ->
    rename_regs(Is, Regs, []).
%% rename_regs([Instruction], Regs, Acc) -> {[Instruction],Regs}
%%  Each destination is given the next free x register, and sources
%%  are replaced according to the assignments made so far. For
%%  instructions that allocate, the number of live registers is
%%  recalculated from the register table.

rename_regs([{set,[Dst0],Srcs0,{alloc,_,Info}}|Is], Regs0, Acc) ->
    Live = live_regs(Regs0),
    Srcs = rename_sources(Srcs0, Regs0),
    {Dst,Regs} = rename_dst(Dst0, Regs0),
    rename_regs(Is, Regs, [{set,[Dst],Srcs,{alloc,Live,Info}}|Acc]);
rename_regs([{set,[Dst0],Srcs0,Info}|Is], Regs0, Acc) ->
    Srcs = rename_sources(Srcs0, Regs0),
    {Dst,Regs} = rename_dst(Dst0, Regs0),
    rename_regs(Is, Regs, [{set,[Dst],Srcs,Info}|Acc]);
rename_regs([], Regs, Acc) ->
    {reverse(Acc),Regs}.

rename_dst(Dst0, Regs0) ->
    Regs = put_reg(Dst0, Regs0),
    {fetch_reg(Dst0, Regs),Regs}.

%% rename_sources([Operand], Regs) -> [Operand]
%%  Replace x and tmp registers; other operands are left alone.

rename_sources(Srcs, Regs) ->
    [rename_source(Src, Regs) || Src <- Srcs].

rename_source({x,_}=Reg, Regs) -> fetch_reg(Reg, Regs);
rename_source({tmp,_}=Reg, Regs) -> fetch_reg(Reg, Regs);
rename_source(Other, _Regs) -> Other.

%%%
%%% Keeping track of register assignments.
%%%
%%% The register table is a list of {Index,Value}, where Index is
%%% the number of the x register holding Value. Indices start at 0
%%% and are consecutive.
%%%

%% init_regs([Register]) -> Regs
%%  Create a table where each free x register maps to itself.
%%  Gaps are marked 'reserved'. Stops at the first y register.

init_regs(Free) ->
    init_regs_1(Free, 0).

init_regs_1([{x,Index}=Reg|Free], Index) ->
    [{Index,Reg}|init_regs_1(Free, Index+1)];
init_regs_1([{x,X}|_]=Free, Index) when Index < X ->
    [{Index,reserved}|init_regs_1(Free, Index+1)];
init_regs_1([{y,_}|_], _Index) ->
    [];
init_regs_1([], _Index) ->
    [].

%% put_reg(Value, Regs) -> Regs
%%  Assign Value to the first x register after those in the table.

put_reg(Value, Regs) ->
    Regs ++ [{length(Regs),Value}].

%% fetch_reg(Value, Regs) -> {x,Index}
%%  Find the register holding Value. Fails with function_clause
%%  if Value is not in the table.

fetch_reg(Value, [{Index,Value}|_]) -> {x,Index};
fetch_reg(Value, [_|Regs]) -> fetch_reg(Value, Regs).

%% live_regs(Regs) -> NumberOfLiveRegisters
%%  Throws gc_bif_alloc_failure if the table contains a
%%  reserved entry.

live_regs([{_,reserved}|_]) ->
    %% We are not sure that this register is initialized, so we must
    %% abort the optimization.
    throw(gc_bif_alloc_failure);
live_regs([{Index,_}]) ->
    Index+1;
live_regs([{_,_}|Regs]) ->
    live_regs(Regs);
live_regs([]) ->
    0.

%%%
%%% Convert a block to Static Single Assignment (SSA) form.
%%%

-record(ssa,
        {live=0,                                %Variable counter.
         sub=gb_trees:empty(),                  %Substitution table.
         prot=gb_sets:empty(),                  %Targets assigned by protecteds.
         in_prot=false                          %Inside a protected.
        }).

ssa_block(Is0) ->
    {Is,_Ssa} = ssa_block_1(Is0, #ssa{}, []),
    Is.
%% ssa_block_1([Instruction], Ssa, Acc) -> {[Instruction],Ssa}
%%  Give every destination register a unique {tmp,N} name and rewrite
%%  the sources accordingly. The sources of an instruction are renamed
%%  using the table as it was before the instruction's own destination
%%  was assigned.

ssa_block_1([{protected,[_],Body0,Labels}|Is], Ssa0, Acc) ->
    {Body,Ssa1} = ssa_block_1(Body0, Ssa0#ssa{in_prot=true}, []),
    Dst = ssa_last_target(Body),
    #ssa{prot=Prot0} = Ssa1,
    #ssa{in_prot=WasInProt} = Ssa0,
    Ssa = Ssa1#ssa{prot=gb_sets:insert(Dst, Prot0),in_prot=WasInProt},
    ssa_block_1(Is, Ssa, [{protected,[Dst],Body,Labels}|Acc]);
ssa_block_1([{set,[Dst0],Srcs0,Op}|Is], Ssa0, Acc) ->
    Ssa = ssa_assign(Dst0, ssa_in_use_list(Srcs0, Ssa0)),
    Dst = ssa_sub(Dst0, Ssa),
    Srcs = ssa_sub_list(Srcs0, Ssa0),
    ssa_block_1(Is, Ssa, [{set,[Dst],Srcs,Op}|Acc]);
ssa_block_1([], Ssa, Acc) ->
    {reverse(Acc),Ssa}.

ssa_in_use_list(Operands, Ssa) ->
    foldl(fun ssa_in_use/2, Ssa, Operands).

%% An x register that is read without having an entry in the
%% substitution table is entered as mapping to itself.

ssa_in_use({x,_}=Reg, #ssa{sub=Sub}=Ssa) ->
    case gb_trees:is_defined(Reg, Sub) of
        true -> Ssa;
        false -> Ssa#ssa{sub=gb_trees:insert(Reg, Reg, Sub)}
    end;
ssa_in_use(_, Ssa) ->
    Ssa.

%% ssa_assign(Register, Ssa) -> Ssa
%%  Map the x register to a new tmp register. If the register already
%%  was in the table, the new tmp register is also entered as mapping
%%  to itself.

ssa_assign({x,_}=Reg, #ssa{sub=Sub0}=Ssa0) ->
    {Tmp,Ssa} = ssa_new_reg(Ssa0),
    Sub = case gb_trees:is_defined(Reg, Sub0) of
              false ->
                  gb_trees:insert(Reg, Tmp, Sub0);
              true ->
                  gb_trees:insert(Tmp, Tmp, gb_trees:update(Reg, Tmp, Sub0))
          end,
    Ssa#ssa{sub=Sub}.

ssa_sub_list(Operands, Ssa) ->
    map(fun(Operand) -> ssa_sub(Operand, Ssa) end, Operands).

%% ssa_sub(Operand, Ssa) -> Operand
%%  Substitute the operand according to the table. Throws
%%  protected_violation if code inside a protected refers to
%%  the target of another protected.

ssa_sub(Operand, #ssa{sub=Sub}=Ssa) ->
    case gb_trees:lookup(Operand, Sub) of
        none -> Operand;
        {value,Reg} -> ssa_sub_check(Reg, Ssa)
    end.

ssa_sub_check(Reg, #ssa{prot=Prot,in_prot=InProt}) ->
    case InProt andalso gb_sets:is_element(Reg, Prot) of
        true -> throw(protected_violation);
        false -> Reg
    end.

ssa_new_reg(#ssa{live=N}=Ssa) ->
    {{tmp,N},Ssa#ssa{live=N+1}}.

%% ssa_last_target([Instruction]) -> Register
%%  Return the destination of the last instruction, which must
%%  be a 'set' instruction.

ssa_last_target([{set,[Dst],_,_}]) -> Dst;
ssa_last_target([_|Is]) -> ssa_last_target(Is).

%% is_killed(Register, [Instruction], FailLabel, State) -> true|false
%%  Determine whether a register is killed in the instruction sequence.
%%  The state is used to allow us to determine the kill state
%%  across branches.

is_killed(Reg, Is, Label, #st{ll=LabelIndex}) ->
    case beam_utils:is_killed(Reg, Is, LabelIndex) of
        true -> beam_utils:is_killed_at(Reg, Label, LabelIndex);
        false -> false
    end.
%% is_not_used(Register, [Instruction], FailLabel, State) -> true|false
%%  Determine whether a register is never used in the instruction sequence
%%  (it could still be referenced by an allocate instruction, meaning that
%%  it MUST be initialized).
%%    The state is used to allow us to determine the usage state
%%  across branches.

is_not_used(Reg, Is, Label, #st{ll=LabelIndex}) ->
    case beam_utils:is_not_used(Reg, Is, LabelIndex) of
        true -> beam_utils:is_not_used_at(Reg, Label, LabelIndex);
        false -> false
    end.

%% initialized_regs([Instruction]) -> [Register]
%%  Given a REVERSED instruction sequence, return a list of the registers
%%  that are guaranteed to be initialized (not contain garbage).
%%  The scan goes backwards and stops at the first allocating
%%  instruction, at the function header, or at any instruction
%%  that is not handled here.

initialized_regs(RevIs) ->
    initialized_regs(RevIs, ordsets:new()).

initialized_regs([{set,Dst,_Src,{alloc,Live,_}}|_], Regs) ->
    add_init_regs(Dst, add_init_regs(free_vars_regs(Live), Regs));
initialized_regs([{set,Dst,Src,_}|RevIs], Regs0) ->
    Regs = add_init_regs(Dst, add_init_regs(Src, Regs0)),
    initialized_regs(RevIs, Regs);
initialized_regs([{test,_,_,Src}|RevIs], Regs) ->
    initialized_regs(RevIs, add_init_regs(Src, Regs));
initialized_regs([{block,Bl}|RevIs], Regs) ->
    initialized_regs(reverse(Bl, RevIs), Regs);
initialized_regs([{bs_context_to_binary,Src}|RevIs], Regs) ->
    initialized_regs(RevIs, add_init_regs([Src], Regs));
initialized_regs([{label,_},{func_info,_,_,Arity}|_], Regs) ->
    add_init_regs(free_vars_regs(Arity), Regs);
initialized_regs([_|_], Regs) ->
    Regs.

%% add_init_regs([Operand], Regs) -> Regs
%%  Add every x register among the operands to the ordered set Regs.

add_init_regs(Operands, Regs0) ->
    foldl(fun({x,_}=Reg, Regs) -> ordsets:add_element(Reg, Regs);
             (_, Regs) -> Regs
          end, Regs0, Operands).