mirror of
https://github.com/Mercury-Language/mercury.git
synced 2026-04-15 01:13:30 +00:00
compiler/hlds_goal.m:
Document that all goals inside from_ground_term_deconstruct scopes
are not just unifications, but unifications whose right hand sides
are rhs_functors.
compiler/constraint.m:
Fix a potential problem, which is that pushing a constraint into
from_ground_term_{deconstruct,other) scopes can invalidate
their invariants.
compiler/goal_refs.m:
Fix a comment.
compiler/lco.m:
Qualify a call.
compiler/modecheck_goal.m:
Fix a misleading predicate name, and typos.
compiler/try_expand.m:
Exploit the newly-documented invariant about from_ground_term_deconstruct
scopes.
2089 lines
87 KiB
Mathematica
2089 lines
87 KiB
Mathematica
%---------------------------------------------------------------------------%
|
|
% vim: ft=mercury ts=4 sw=4 et
|
|
%---------------------------------------------------------------------------%
|
|
% Copyright (C) 1996-2012 The University of Melbourne.
|
|
% Copyright (C) 2013-2026 The Mercury team.
|
|
% This file may only be copied under the terms of the GNU General
|
|
% Public License - see the file COPYING in the Mercury distribution.
|
|
%---------------------------------------------------------------------------%
|
|
%
|
|
% File: lco.m.
|
|
% Author: zs.
|
|
% Modifications by wangp.
|
|
%
|
|
% Transform predicates with calls that are tail recursive modulo construction
|
|
% where (1) all recursive calls have the same args participating in the "modulo
|
|
% construction" part and (2) all the other output args are returned in the same
|
|
% registers in all recursive calls as expected by the head.
|
|
%
|
|
% p(In1, ... InN, Out1, ... OutM) :-
|
|
% Out1 = ground
|
|
% p(In1, ... InN, Out1, ... OutM) :-
|
|
% ...
|
|
% p(In1, ... InN, Mid1, Out2... OutM)
|
|
% Out1 = f1(...Mid1...)
|
|
%
|
|
% The definition of append fits this pattern:
|
|
%
|
|
% app(list(T)::in, list(T)::in, list(T)::out)
|
|
% app(A, B, C) :-
|
|
% (
|
|
% A == [],
|
|
% C := B
|
|
% ;
|
|
% A => [H | T],
|
|
% app(T, B, NT),
|
|
% C <= [H | NT]
|
|
% )
|
|
%
|
|
%---------------------------------------------------------------------------%
|
|
%
|
|
% TRANSFORMATION FOR LOW-LEVEL DATA
|
|
%
|
|
% Concrete example of what the original predicate and its return-via-memory
|
|
% variant should look like for append, in grades for which it is possible to
|
|
% take the address of a field:
|
|
%
|
|
% app(list(T)::in, list(T)::in, list(T)::out)
|
|
% app(A, B, C) :-
|
|
% (
|
|
% A == [],
|
|
% C := B
|
|
% ;
|
|
% A => [H | T],
|
|
% C <= [H | _HT] capture &HT in AddrHT
|
|
% app'(T, B, AddrHT)
|
|
% )
|
|
%
|
|
% app'(list(T)::in, list(T)::in, store_at_ref_type(T)::in)
|
|
% app'(A, B, AddrC) :-
|
|
% (
|
|
% A == [],
|
|
% C := B,
|
|
% store_at_ref_impure(AddrC, C)
|
|
% ;
|
|
% A => [H | T],
|
|
% C <= [H | _HT] capture &HT in AddrHT
|
|
% store_at_ref_impure(AddrC, C)
|
|
% app'(T, B, AddrHT)
|
|
% )
|
|
%
|
|
% The transformation done on the original predicate is to take recursive calls
|
|
% followed by construction unifications that use outputs of the recursive calls
|
|
% (each being used just once) and
|
|
%
|
|
% 1 move the constructions from after the recursive call to before, and attach
|
|
% a feature to them that tells the code generator to not define a given list
|
|
% of fields, but to capture their addresses in the related variable instead,
|
|
%
|
|
% 2 make the call go to the variant, and pass the address variables (e.g.
|
|
% AddrHT) as inputs instead of the original variables (e.g. HT) as outputs.
|
|
%
|
|
% The variant predicate is based on the transformed version of the original
|
|
% predicate, but it has a further transformation performed on it. This further
|
|
% transformation
|
|
%
|
|
% 3 replaces the output arguments with input arguments of type
|
|
% store_at_ref_type(T), where T is type of the field pointed to, and
|
|
%
|
|
% 4 calls to other procedures in the same SCC that are tail calls module
|
|
% constructors are replaced by calls to variants where possible, and
|
|
%
|
|
% 5 follows each primitive goal that binds one of the output arguments
|
|
% with a store to the memory location indicated by the corresponding pointer.
|
|
%
|
|
% p(In1, ... InN, Out1, ... OutM) :-
|
|
% Out1 = ground
|
|
% p(In1, ... InN, Out1, ... OutM) :-
|
|
% ...
|
|
% Out1 = f1(...Mid1...)
|
|
% capture addr of Mid1 in AddrMid1
|
|
% p'(In1, ... InN, AddrMid1, Out2... OutM)
|
|
%
|
|
% p'(In1, ... InN, RefOut1, ... OutM) :-
|
|
% Out1 = ground,
|
|
% store_at_ref_impure(RefOut1, Out1)
|
|
% p'(In1, ... InN, RefOut1, Out2... OutM) :-
|
|
% ...
|
|
% Out1 = f1(...Mid1...)
|
|
% capture addr of Mid1 in AddrMid1
|
|
% store_at_ref_impure(RefOut1, Out1)
|
|
% p'(In1, ... InN, AddrMid1, Out2... OutM)
|
|
%
|
|
%---------------------------------------------------------------------------%
|
|
%
|
|
% TRANSFORMATION FOR HIGH-LEVEL DATA
|
|
%
|
|
% In grades where it is impossible to take the address of a field (we assume
|
|
% this is so when using --highlevel-data), the transformed procedures are
|
|
% passed partially instantiated cells, whose holes need to be filled.
|
|
% The append example looks like:
|
|
%
|
|
% app(list(T)::in, list(T)::in, list(T)::out)
|
|
% app(A, B, C) :-
|
|
% (
|
|
% A == [],
|
|
% C := B
|
|
% ;
|
|
% A => [H | T],
|
|
% C <= [H | _], % with hole
|
|
% app'(T, B, C)
|
|
% )
|
|
%
|
|
% app'(list(T)::in, list(T)::in, T::in(bound('[|]'(ground, free))))
|
|
% app'(A, B, C) :-
|
|
% (
|
|
% A == [],
|
|
% C => [_ | []] % fill in hole
|
|
% ;
|
|
% A => [H | T],
|
|
% C <= [H | _HT], % bind C to AddrC
|
|
% app'(T, B, AddrC)
|
|
% )
|
|
%
|
|
% The differences are:
|
|
%
|
|
% 1 The output arguments become partially instantiated input arguments
|
|
% instead of store_at_ref_type(T) arguments.
|
|
%
|
|
% 2 The holes in the output arguments are filled in with unifications
|
|
% instead of a store_at_ref_impure builtin.
|
|
%
|
|
% 3 Variant procedures need to know the functor and position of the argument in
|
|
% the partially instantiated structures, so many more variants could be
|
|
% produced. The number of variants is capped.
|
|
%
|
|
%---------------------------------------------------------------------------%
|
|
|
|
:- module transform_hlds.lco.
|
|
:- interface.
|
|
|
|
:- import_module hlds.
|
|
:- import_module hlds.hlds_module.
|
|
|
|
:- pred lco_modulo_constructors(module_info::in, module_info::out) is det.
|
|
|
|
%---------------------------------------------------------------------------%
|
|
%---------------------------------------------------------------------------%
|
|
|
|
:- implementation.
|
|
|
|
:- import_module check_hlds.
|
|
:- import_module check_hlds.recompute_instmap_deltas.
|
|
:- import_module hlds.arg_info.
|
|
:- import_module hlds.goal_util.
|
|
:- import_module hlds.goal_vars.
|
|
:- import_module hlds.hlds_data.
|
|
:- import_module hlds.hlds_dependency_graph.
|
|
:- import_module hlds.hlds_goal.
|
|
:- import_module hlds.hlds_out.
|
|
:- import_module hlds.hlds_out.hlds_out_goal.
|
|
:- import_module hlds.hlds_pred.
|
|
:- import_module hlds.hlds_proc_util.
|
|
:- import_module hlds.inst_lookup.
|
|
:- import_module hlds.inst_test.
|
|
:- import_module hlds.instmap.
|
|
:- import_module hlds.mode_top_functor.
|
|
:- import_module hlds.passes_aux.
|
|
:- import_module hlds.pred_name.
|
|
:- import_module hlds.pred_table.
|
|
:- import_module hlds.quantification.
|
|
:- import_module hlds.status.
|
|
:- import_module hlds.type_util.
|
|
:- import_module libs.
|
|
:- import_module libs.dependency_graph.
|
|
:- import_module libs.globals.
|
|
:- import_module libs.options.
|
|
:- import_module mdbcomp.
|
|
:- import_module mdbcomp.builtin_modules.
|
|
:- import_module mdbcomp.prim_data.
|
|
:- import_module mdbcomp.sym_name.
|
|
:- import_module parse_tree.
|
|
:- import_module parse_tree.builtin_lib_types.
|
|
:- import_module parse_tree.parse_tree_out_cons_id.
|
|
:- import_module parse_tree.parse_tree_out_info.
|
|
:- import_module parse_tree.parse_tree_out_term.
|
|
:- import_module parse_tree.prog_data.
|
|
:- import_module parse_tree.prog_mode.
|
|
:- import_module parse_tree.prog_rename.
|
|
:- import_module parse_tree.prog_type.
|
|
:- import_module parse_tree.prog_util.
|
|
:- import_module parse_tree.set_of_var.
|
|
:- import_module parse_tree.var_db.
|
|
:- import_module parse_tree.var_table.
|
|
|
|
:- import_module assoc_list.
|
|
:- import_module bag.
|
|
:- import_module bool.
|
|
:- import_module cord.
|
|
:- import_module int.
|
|
:- import_module io.
|
|
:- import_module list.
|
|
:- import_module map.
|
|
:- import_module maybe.
|
|
:- import_module multi_map.
|
|
:- import_module pair.
|
|
:- import_module require.
|
|
:- import_module set.
|
|
:- import_module string.
|
|
:- import_module term_context.
|
|
:- import_module varset.
|
|
|
|
%---------------------------------------------------------------------------%
|
|
|
|
:- type variant_id
|
|
---> variant_id(
|
|
list(variant_arg), % The output arguments returned in memory.
|
|
pred_proc_id, % The id of the variant.
|
|
sym_name % The sym_name of the variant predicate.
|
|
).
|
|
|
|
:- type variant_arg
|
|
---> variant_arg(
|
|
% Position of the output argument. The first output argument
|
|
% is 1, the second is 2, and so on, without counting input
|
|
% arguments.
|
|
va_pos :: int,
|
|
|
|
% For low-level data, this field should be `no'.
|
|
% For high-level data, this field should be `yes(FieldId)'
|
|
% where FieldId indicates the functor that the argument
|
|
% will be bound to, and the argument of that functor
|
|
% which is to be filled.
|
|
va_field :: maybe(field_id)
|
|
).
|
|
|
|
% Materialize this automatically defined field access function,
|
|
% so we can pass it to higher order code.
|
|
%
|
|
:- func va_pos(variant_arg) = int.
|
|
|
|
:- type field_id
|
|
---> field_id(
|
|
fi_type :: mer_type,
|
|
fi_cons_id :: cons_id,
|
|
fi_arg :: int
|
|
).
|
|
|
|
:- type variant_map == multi_map(pred_proc_id, variant_id).
|
|
|
|
:- type lco_is_permitted_on_scc
|
|
---> lco_is_not_permitted_on_scc
|
|
; lco_is_permitted_on_scc.
|
|
|
|
:- type proc_changed
|
|
---> proc_not_changed
|
|
; proc_changed.
|
|
|
|
:- type allow_float_addr
|
|
---> do_not_allow_float_addr
|
|
; allow_float_addr.
|
|
|
|
:- type lco_info
|
|
---> lco_info(
|
|
lco_module_info :: module_info,
|
|
lco_cur_scc_variants :: variant_map,
|
|
lco_var_table :: var_table,
|
|
lco_permitted :: lco_is_permitted_on_scc,
|
|
lco_changed :: proc_changed
|
|
).
|
|
|
|
:- type lco_const_info
|
|
---> lco_const_info(
|
|
lci_lower_scc_variants :: variant_map,
|
|
lci_cur_scc :: set(pred_proc_id),
|
|
lci_cur_proc_id :: pred_proc_id,
|
|
lci_cur_proc_pred :: pred_info,
|
|
lci_cur_proc_proc :: proc_info,
|
|
lci_cur_proc_outputs :: list(prog_var),
|
|
lci_cur_proc_detism :: determinism,
|
|
lci_allow_float_addr :: allow_float_addr,
|
|
lci_highlevel_data :: bool
|
|
).
|
|
|
|
:- type var_to_target == assoc_list(prog_var, store_target).
|
|
|
|
:- type store_target
|
|
---> store_target(
|
|
prog_var,
|
|
maybe(field_id)
|
|
).
|
|
|
|
%---------------------------------------------------------------------------%
|
|
|
|
lco_modulo_constructors(!ModuleInfo) :-
|
|
module_info_rebuild_dependency_info(!ModuleInfo, DepInfo),
|
|
SCCs = dependency_info_get_bottom_up_sccs(DepInfo),
|
|
list.foldl2(lco_scc, SCCs, map.init, _, !ModuleInfo).
|
|
|
|
:- pred lco_scc(set(pred_proc_id)::in, variant_map::in, variant_map::out,
|
|
module_info::in, module_info::out) is det.
|
|
|
|
lco_scc(SCC, VariantMap, VariantMap, !ModuleInfo) :-
|
|
% XXX Did we forget to add CurSCCVariants to !VariantMap? Yes, we did.
|
|
ModuleInfo0 = !.ModuleInfo,
|
|
set.foldl4(lco_proc_if_permitted(VariantMap, SCC), SCC, !ModuleInfo,
|
|
map.init, CurSCCVariantMap, map.init, CurSCCUpdateMap,
|
|
lco_is_permitted_on_scc, Permitted),
|
|
multi_map.to_flat_assoc_list(CurSCCVariantMap, CurSCCVariants),
|
|
map.to_assoc_list(CurSCCUpdateMap, CurSCCUpdates),
|
|
( if
|
|
Permitted = lco_is_permitted_on_scc,
|
|
CurSCCUpdates = [_ | _]
|
|
then
|
|
trace [compile_time(flag("lco_log_updates")), io(!IO)] (
|
|
io.open_append("/tmp/LCO_LOG", OpenResult, !IO),
|
|
(
|
|
OpenResult = ok(Stream),
|
|
io.write_string(Stream, "updating scc:\n", !IO),
|
|
list.foldl(lco_log_update(Stream, !.ModuleInfo),
|
|
CurSCCUpdates, !IO),
|
|
io.close_output(Stream, !IO)
|
|
;
|
|
OpenResult = error(_)
|
|
)
|
|
),
|
|
list.foldl(store_updated_procs_in_module_info, CurSCCUpdates,
|
|
!ModuleInfo),
|
|
list.foldl(update_variant_pred_info(CurSCCVariantMap), CurSCCVariants,
|
|
!ModuleInfo)
|
|
else
|
|
!:ModuleInfo = ModuleInfo0
|
|
).
|
|
|
|
:- pred lco_log_update(io.text_output_stream::in, module_info::in,
|
|
pair(pred_proc_id, proc_info)::in, io::di, io::uo) is det.
|
|
|
|
lco_log_update(Stream, ModuleInfo, PredProcId - _NewProcInfo, !IO) :-
|
|
PredProcId = proc(PredId, ProcId),
|
|
module_info_pred_info(ModuleInfo, PredId, PredInfo),
|
|
pred_info_get_module_name(PredInfo, ModuleName),
|
|
pred_info_get_name(PredInfo, PredName),
|
|
SymNameStr = sym_name_to_string(qualified(ModuleName, PredName)),
|
|
ProcIdInt = proc_id_to_int(ProcId),
|
|
io.format(Stream, " %s/%d\n", [s(SymNameStr), i(ProcIdInt)], !IO).
|
|
|
|
%---------------------------------------------------------------------------%
|
|
|
|
:- pred lco_proc_if_permitted(variant_map::in, scc::in, pred_proc_id::in,
|
|
module_info::in, module_info::out, variant_map::in, variant_map::out,
|
|
map(pred_proc_id, proc_info)::in, map(pred_proc_id, proc_info)::out,
|
|
lco_is_permitted_on_scc::in, lco_is_permitted_on_scc::out) is det.
|
|
|
|
lco_proc_if_permitted(LowerSCCVariants, SCC, CurProc,
|
|
!ModuleInfo, !CurSCCVariants, !CurSCCUpdates, !Permitted) :-
|
|
(
|
|
!.Permitted = lco_is_not_permitted_on_scc
|
|
;
|
|
!.Permitted = lco_is_permitted_on_scc,
|
|
CurProc = proc(PredId, ProcId),
|
|
module_info_pred_proc_info(!.ModuleInfo, PredId, ProcId,
|
|
PredInfo, ProcInfo0),
|
|
pred_info_get_status(PredInfo, PredStatus),
|
|
DefInThisModule = pred_status_defined_in_this_module(PredStatus),
|
|
proc_info_get_inferred_determinism(ProcInfo0, Detism),
|
|
( if
|
|
DefInThisModule = yes,
|
|
acceptable_detism_for_lco(Detism) = yes
|
|
then
|
|
lco_proc(LowerSCCVariants, SCC, CurProc, PredInfo, ProcInfo0,
|
|
!ModuleInfo, !CurSCCVariants, !CurSCCUpdates, !:Permitted)
|
|
else
|
|
!:Permitted = lco_is_not_permitted_on_scc
|
|
)
|
|
).
|
|
|
|
:- pred lco_proc(variant_map::in, scc::in, pred_proc_id::in,
|
|
pred_info::in, proc_info::in,
|
|
module_info::in, module_info::out, variant_map::in, variant_map::out,
|
|
map(pred_proc_id, proc_info)::in, map(pred_proc_id, proc_info)::out,
|
|
lco_is_permitted_on_scc::out) is det.
|
|
|
|
lco_proc(LowerSCCVariants, SCC, CurProc, PredInfo, ProcInfo0,
|
|
!ModuleInfo, !CurSCCVariants, !CurSCCUpdates, !:Permitted) :-
|
|
trace [compiletime(flag("lco")), io(!IO)] (
|
|
get_debug_output_stream(!.ModuleInfo, DebugStream, !IO),
|
|
io.write_string(DebugStream, "\nlco_proc ", !IO),
|
|
io.write_line(DebugStream, CurProc, !IO),
|
|
io.flush_output(DebugStream, !IO)
|
|
),
|
|
proc_info_get_var_table(ProcInfo0, VarTable0),
|
|
proc_info_get_headvars(ProcInfo0, HeadVars),
|
|
proc_info_get_argmodes(ProcInfo0, ArgModes),
|
|
arg_info.compute_in_and_out_vars(!.ModuleInfo, VarTable0,
|
|
HeadVars, ArgModes, _InputHeadVars, OutputHeadVars),
|
|
proc_info_get_inferred_determinism(ProcInfo0, CurProcDetism),
|
|
module_info_get_globals(!.ModuleInfo, Globals),
|
|
globals.get_target(Globals, Target),
|
|
HighLevelData = compilation_target_high_level_data(Target),
|
|
globals.lookup_bool_option(Globals, unboxed_float, UnboxedFloat),
|
|
(
|
|
UnboxedFloat = no,
|
|
% In both C backends, we can and do store doubles across two words
|
|
% of a cell when sizeof(double) > sizeof(void *). However we are
|
|
% not yet ready to take the address of double-word fields
|
|
% nor to assign to them.
|
|
AllowFloatAddr = do_not_allow_float_addr
|
|
;
|
|
UnboxedFloat = yes,
|
|
AllowFloatAddr = allow_float_addr
|
|
),
|
|
ConstInfo = lco_const_info(LowerSCCVariants, SCC,
|
|
CurProc, PredInfo, ProcInfo0, OutputHeadVars, CurProcDetism,
|
|
AllowFloatAddr, HighLevelData),
|
|
Info0 = lco_info(!.ModuleInfo, !.CurSCCVariants, VarTable0,
|
|
lco_is_permitted_on_scc, proc_not_changed),
|
|
proc_info_get_goal(ProcInfo0, Goal0),
|
|
lco_in_goal(Goal0, Goal, Info0, Info, ConstInfo),
|
|
Info = lco_info(!:ModuleInfo, !:CurSCCVariants, VarTable,
|
|
!:Permitted, Changed),
|
|
( if
|
|
!.Permitted = lco_is_permitted_on_scc,
|
|
Changed = proc_changed
|
|
then
|
|
trace [compiletime(flag("lco")), io(!IO)] (
|
|
get_lco_debug_output_stream(Info, DebugStream, !IO),
|
|
pred_info_get_typevarset(PredInfo, TVarSet),
|
|
proc_info_get_inst_varset(ProcInfo0, InstVarSet),
|
|
io.write_string(DebugStream, "\ngoal before lco:\n", !IO),
|
|
dump_goal_nl(DebugStream, !.ModuleInfo, vns_var_table(VarTable),
|
|
TVarSet, InstVarSet, Goal0, !IO),
|
|
io.write_string(DebugStream, "\ngoal after lco:\n", !IO),
|
|
dump_goal_nl(DebugStream, !.ModuleInfo, vns_var_table(VarTable),
|
|
TVarSet, InstVarSet, Goal, !IO)
|
|
),
|
|
some [!ProcInfo] (
|
|
!:ProcInfo = ProcInfo0,
|
|
proc_info_set_var_table(VarTable, !ProcInfo),
|
|
proc_info_set_goal(Goal, !ProcInfo),
|
|
% See the comment in transform_call_and_unifies for why these
|
|
% are needed.
|
|
requantify_proc_general(ord_nl_no_lambda, !ProcInfo),
|
|
recompute_instmap_delta_proc(recomp_atomics,
|
|
!ProcInfo, !ModuleInfo),
|
|
map.det_insert(CurProc, !.ProcInfo, !CurSCCUpdates)
|
|
)
|
|
else
|
|
true
|
|
).
|
|
|
|
% Procedures which can succeed more than once can't do proper tail calls,
|
|
% and procedures that cannot succeed at all should not be optimized
|
|
% for time.
|
|
%
|
|
:- func acceptable_detism_for_lco(determinism) = bool.
|
|
|
|
acceptable_detism_for_lco(detism_det) = yes.
|
|
acceptable_detism_for_lco(detism_semi) = yes.
|
|
acceptable_detism_for_lco(detism_cc_multi) = yes.
|
|
acceptable_detism_for_lco(detism_cc_non) = yes.
|
|
acceptable_detism_for_lco(detism_multi) = no.
|
|
acceptable_detism_for_lco(detism_non) = no.
|
|
acceptable_detism_for_lco(detism_failure) = no.
|
|
acceptable_detism_for_lco(detism_erroneous) = no.
|
|
|
|
%---------------------------------------------------------------------------%
|
|
%---------------------------------------------------------------------------%
|
|
|
|
:- pred lco_in_goal(hlds_goal::in, hlds_goal::out, lco_info::in, lco_info::out,
|
|
lco_const_info::in) is det.
|
|
|
|
lco_in_goal(Goal0, Goal, !Info, ConstInfo) :-
|
|
Goal0 = hlds_goal(GoalExpr0, GoalInfo),
|
|
(
|
|
GoalExpr0 = conj(ConjType, Goals0),
|
|
(
|
|
ConjType = plain_conj,
|
|
lco_in_conj(Goals0, MaybeGoals, !Info, ConstInfo),
|
|
(
|
|
MaybeGoals = yes(Goals),
|
|
GoalExpr = conj(plain_conj, Goals)
|
|
;
|
|
MaybeGoals = no,
|
|
% If the top-level conjunction doesn't end with some
|
|
% unifications we can move before a recursive call,
|
|
% maybe it ends with a switch or if-then-else, some of whose
|
|
% arms fit that pattern.
|
|
( if list.split_last(Goals0, AllButLast, Last0) then
|
|
lco_in_goal(Last0, Last, !Info, ConstInfo),
|
|
GoalExpr = conj(plain_conj, AllButLast ++ [Last])
|
|
else
|
|
GoalExpr = GoalExpr0
|
|
)
|
|
)
|
|
;
|
|
ConjType = parallel_conj,
|
|
GoalExpr = GoalExpr0,
|
|
!Info ^ lco_permitted := lco_is_not_permitted_on_scc
|
|
)
|
|
;
|
|
GoalExpr0 = disj(Goals0),
|
|
% There is no point in looking for tail calls in the non-last
|
|
% disjuncts.
|
|
( if list.split_last(Goals0, AllButLast, Last0) then
|
|
lco_in_goal(Last0, Last, !Info, ConstInfo),
|
|
GoalExpr = disj(AllButLast ++ [Last])
|
|
else
|
|
GoalExpr = GoalExpr0
|
|
)
|
|
;
|
|
GoalExpr0 = switch(Var, CanFail, Cases0),
|
|
lco_in_cases(Cases0, Cases, !Info, ConstInfo),
|
|
GoalExpr = switch(Var, CanFail, Cases)
|
|
;
|
|
GoalExpr0 = if_then_else(Vars, Cond, Then0, Else0),
|
|
lco_in_goal(Then0, Then, !Info, ConstInfo),
|
|
lco_in_goal(Else0, Else, !Info, ConstInfo),
|
|
GoalExpr = if_then_else(Vars, Cond, Then, Else)
|
|
;
|
|
GoalExpr0 = scope(Reason, SubGoal0),
|
|
( if
|
|
Reason = from_ground_term(_, FGT),
|
|
( FGT = from_ground_term_construct
|
|
; FGT = from_ground_term_deconstruct
|
|
)
|
|
then
|
|
GoalExpr = GoalExpr0
|
|
else
|
|
lco_in_goal(SubGoal0, SubGoal, !Info, ConstInfo),
|
|
GoalExpr = scope(Reason, SubGoal)
|
|
)
|
|
;
|
|
( GoalExpr0 = negation(_)
|
|
; GoalExpr0 = generic_call(_, _, _, _, _)
|
|
; GoalExpr0 = plain_call(_, _, _, _, _, _)
|
|
; GoalExpr0 = unify(_, _, _, _, _)
|
|
; GoalExpr0 = call_foreign_proc(_, _, _, _, _, _, _)
|
|
),
|
|
GoalExpr = GoalExpr0
|
|
;
|
|
GoalExpr0 = shorthand(_),
|
|
% These should have been expanded out by now.
|
|
unexpected($pred, "shorthand")
|
|
),
|
|
Goal = hlds_goal(GoalExpr, GoalInfo).
|
|
|
|
%---------------------------------------------------------------------------%
|
|
|
|
:- pred lco_in_cases(list(case)::in, list(case)::out,
|
|
lco_info::in, lco_info::out, lco_const_info::in) is det.
|
|
|
|
lco_in_cases([], [], !Info, _ConstInfo).
|
|
lco_in_cases([Case0 | Cases0], [Case | Cases], !Info, ConstInfo) :-
|
|
Case0 = case(MainConsId, OtherConsIds, Goal0),
|
|
lco_in_goal(Goal0, Goal, !Info, ConstInfo),
|
|
Case = case(MainConsId, OtherConsIds, Goal),
|
|
lco_in_cases(Cases0, Cases, !Info, ConstInfo).
|
|
|
|
%---------------------------------------------------------------------------%
|
|
%---------------------------------------------------------------------------%
|
|
|
|
% lco_in_conj(Goals0, MaybeGoals, !Info, ConstInfo)
|
|
%
|
|
% Given a conjunction whose structure is:
|
|
%
|
|
% zero or more arbitrary goals
|
|
% recursive call that could be a last call modulo constructors
|
|
% one or more moveable goals
|
|
%
|
|
% move the moveable goals before the call.
|
|
% If successful, MaybeGoals is yes(Goals) with the goals in the new order.
|
|
% Otherwise MaybeGoals is no.
|
|
%
|
|
:- pred lco_in_conj(list(hlds_goal)::in, maybe(list(hlds_goal))::out,
|
|
lco_info::in, lco_info::out, lco_const_info::in) is det.
|
|
|
|
lco_in_conj(Goals0, MaybeGoals, !Info, ConstInfo) :-
|
|
list.reverse(Goals0, RevGoals0),
|
|
( if
|
|
divide_rev_conj(!.Info, ConstInfo, RevGoals0, [], AfterGoals,
|
|
RecGoal, RecOutArgs, RevBeforeGoals),
|
|
AfterGoals = [_ | _],
|
|
set_of_var.list_to_set(RecOutArgs, DelayForVars0),
|
|
list.foldl3(partition_dependent_goal(!.Info, ConstInfo), AfterGoals,
|
|
[], RevAfterDependentGoals,
|
|
[], RevAfterNonDependentGoals,
|
|
DelayForVars0, DelayForVars),
|
|
list.foldl(
|
|
acceptable_construct_unification(!.Info, ConstInfo, DelayForVars),
|
|
RevAfterDependentGoals, bag.init, UnifyInputVars)
|
|
then
|
|
list.reverse(RevAfterDependentGoals, UnifyGoals),
|
|
transform_call_and_unifies(RecGoal, RecOutArgs,
|
|
UnifyGoals, UnifyInputVars, MaybeGoals1, !Info, ConstInfo),
|
|
(
|
|
MaybeGoals1 = yes(UpdatedRecAndUnifies),
|
|
Goals = list.reverse(RevBeforeGoals)
|
|
++ list.reverse(RevAfterNonDependentGoals)
|
|
++ UpdatedRecAndUnifies,
|
|
MaybeGoals = yes(Goals)
|
|
;
|
|
MaybeGoals1 = no,
|
|
MaybeGoals = no
|
|
)
|
|
else
|
|
MaybeGoals = no
|
|
).
|
|
|
|
% Divide a conjunction into
|
|
% - a list of goals before the rightmost recursive call
|
|
% - the recursive call itself
|
|
% - the goals following the recursive call which could potentially be
|
|
% moved before the recursive call, using the LCMC transform if necessary.
|
|
%
|
|
% invariant:
|
|
% reverse(RevGoals0) ++ AfterGoals0
|
|
% = reverse(RevBeforeGoals) ++ [RecGoal] ++ AfterGoals
|
|
%
|
|
:- pred divide_rev_conj(lco_info::in, lco_const_info::in, list(hlds_goal)::in,
|
|
list(hlds_goal)::in, list(hlds_goal)::out,
|
|
hlds_goal::out, list(prog_var)::out, list(hlds_goal)::out) is semidet.
|
|
|
|
divide_rev_conj(Info, ConstInfo, RevGoals0, !AfterGoals, RecGoal, RecOutArgs,
|
|
RevBeforeGoals) :-
|
|
(
|
|
RevGoals0 = [],
|
|
% No recursive call found.
|
|
fail
|
|
;
|
|
RevGoals0 = [RevGoal | RevGoalsTail],
|
|
( if
|
|
potentially_transformable_recursive_call(Info, ConstInfo, RevGoal,
|
|
OutArgs)
|
|
then
|
|
RecGoal = RevGoal,
|
|
RecOutArgs = OutArgs,
|
|
RevBeforeGoals = RevGoalsTail
|
|
else if
|
|
potentially_moveable_goal(RevGoal)
|
|
then
|
|
!:AfterGoals = [RevGoal | !.AfterGoals],
|
|
divide_rev_conj(Info, ConstInfo, RevGoalsTail, !AfterGoals,
|
|
RecGoal, RecOutArgs, RevBeforeGoals)
|
|
else
|
|
fail
|
|
)
|
|
).
|
|
|
|
:- pred potentially_transformable_recursive_call(lco_info::in,
|
|
lco_const_info::in, hlds_goal::in, list(prog_var)::out) is semidet.
|
|
|
|
potentially_transformable_recursive_call(Info, ConstInfo, Goal, OutArgs) :-
|
|
Goal = hlds_goal(GoalExpr, GoalInfo),
|
|
GoalExpr = plain_call(PredId, ProcId, Args, _Builtin, _UnifyContext,
|
|
_SymName),
|
|
set.member(proc(PredId, ProcId), ConstInfo ^ lci_cur_scc),
|
|
goal_info_get_determinism(GoalInfo) = ConstInfo ^ lci_cur_proc_detism,
|
|
|
|
ModuleInfo = Info ^ lco_module_info,
|
|
ProcInfo = ConstInfo ^ lci_cur_proc_proc,
|
|
proc_info_get_var_table(ProcInfo, VarTable),
|
|
|
|
module_info_proc_info(ModuleInfo, PredId, ProcId, CalleeProcInfo),
|
|
proc_info_get_argmodes(CalleeProcInfo, CalleeArgModes),
|
|
classify_proc_call_args(ModuleInfo, VarTable, Args, CalleeArgModes,
|
|
_InArgs, OutArgs, UnusedArgs),
|
|
UnusedArgs = [],
|
|
|
|
trace [compiletime(flag("lco")), io(!IO)] (
|
|
get_lco_debug_output_stream(Info, DebugStream, !IO),
|
|
io.write_string(DebugStream, "call output args: ", !IO),
|
|
io.write_line(DebugStream, OutArgs, !IO)
|
|
),
|
|
list.length(OutArgs, NumOutArgs),
|
|
CurrProcOutArgs = ConstInfo ^ lci_cur_proc_outputs,
|
|
list.length(CurrProcOutArgs, NumCurrProcOutArgs),
|
|
NumOutArgs = NumCurrProcOutArgs.
|
|
|
|
% A goal is potentially moveable before a recursive call if it is det, and
|
|
% guaranteed neither to throw an exception nor loop forever (subject to
|
|
% --no-reorder-conj). It is actually moveable if it does not depend on the
|
|
% output of the recursive call.
|
|
%
|
|
% For now we only move unification goals and goals which construct ground
|
|
% terms.
|
|
%
|
|
:- pred potentially_moveable_goal(hlds_goal::in) is semidet.
|
|
|
|
potentially_moveable_goal(Goal) :-
|
|
Goal = hlds_goal(GoalExpr, GoalInfo),
|
|
goal_info_get_determinism(GoalInfo) = detism_det,
|
|
require_complete_switch [GoalExpr]
|
|
(
|
|
GoalExpr = unify(_, _, _, _, _)
|
|
;
|
|
GoalExpr = scope(Reason, SubGoal),
|
|
( if Reason = from_ground_term(_, _) then
|
|
true
|
|
else
|
|
potentially_moveable_goal(SubGoal)
|
|
)
|
|
;
|
|
GoalExpr = generic_call(GenericCall, _, _, _, GenericDetism),
|
|
(
|
|
GenericCall = cast(CastKind),
|
|
% All cast kinds are now moveable, but list them all,
|
|
% to force this code to be looked at if we ever add a new kind.
|
|
( CastKind = unsafe_type_cast
|
|
; CastKind = unsafe_type_inst_cast
|
|
; CastKind = equiv_type_cast
|
|
; CastKind = exists_cast
|
|
; CastKind = subtype_coerce
|
|
),
|
|
GenericDetism = detism_det
|
|
;
|
|
( GenericCall = higher_order(_, _, _, _, _)
|
|
; GenericCall = class_method(_, _, _, _)
|
|
; GenericCall = event_call(_)
|
|
),
|
|
fail
|
|
)
|
|
;
|
|
( GoalExpr = plain_call(_, _, _, _, _, _)
|
|
; GoalExpr = call_foreign_proc(_, _, _, _, _, _, _)
|
|
; GoalExpr = conj(_, _)
|
|
; GoalExpr = disj(_)
|
|
; GoalExpr = switch(_, _, _)
|
|
; GoalExpr = negation(_)
|
|
; GoalExpr = if_then_else(_, _, _, _)
|
|
),
|
|
fail
|
|
;
|
|
GoalExpr = shorthand(_),
|
|
unexpected($pred, "shorthand")
|
|
).
|
|
|
|
% Partition a goal which follows a recursive call goal into those goals
|
|
% which depend directly or indirectly on an output of the recursive call,
|
|
% and those goals which don't.
|
|
%
|
|
:- pred partition_dependent_goal(lco_info::in, lco_const_info::in,
|
|
hlds_goal::in, list(hlds_goal)::in, list(hlds_goal)::out,
|
|
list(hlds_goal)::in, list(hlds_goal)::out,
|
|
set_of_progvar::in, set_of_progvar::out) is det.
|
|
|
|
partition_dependent_goal(_Info, _ConstInfo, Goal,
|
|
!RevDependentGoals, !RevNonDependentGoals, !DelayForVars) :-
|
|
Goal = hlds_goal(_GoalExpr, GoalInfo),
|
|
vars_in_goal(Goal, GoalVars),
|
|
set_of_var.intersect(!.DelayForVars, GoalVars, Intersection),
|
|
( if set_of_var.is_empty(Intersection) then
|
|
!:RevNonDependentGoals = [Goal | !.RevNonDependentGoals]
|
|
else
|
|
!:RevDependentGoals = [Goal | !.RevDependentGoals],
|
|
% Expand the set of variables for which we must delay goals.
|
|
InstmapDelta = goal_info_get_instmap_delta(GoalInfo),
|
|
instmap_delta_changed_vars(InstmapDelta, ChangedVars),
|
|
set_of_var.union(ChangedVars, !DelayForVars)
|
|
).
|
|
|
|
%---------------------------------------------------------------------------%
|
|
|
|
:- pred acceptable_construct_unification(lco_info::in, lco_const_info::in,
|
|
set_of_progvar::in, hlds_goal::in,
|
|
bag(prog_var)::in, bag(prog_var)::out) is semidet.
|
|
|
|
acceptable_construct_unification(Info, ConstInfo, DelayForVars, Goal,
|
|
!UnifyInputVars) :-
|
|
Goal = hlds_goal(GoalExpr, _GoalInfo),
|
|
GoalExpr = unify(_, _, _, Unification, _),
|
|
Unification = construct(ConstructedVar, ConsId, ConstructArgVars,
|
|
ArgModes, _, _, SubInfo),
|
|
(
|
|
SubInfo = no_construct_sub_info
|
|
;
|
|
SubInfo = construct_sub_info(MaybeTakeAddrs, _),
|
|
MaybeTakeAddrs = no
|
|
),
|
|
ModuleInfo = Info ^ lco_module_info,
|
|
VarTable = Info ^ lco_var_table,
|
|
acceptable_construct_modes(ModuleInfo, VarTable,
|
|
ConstructArgVars, ArgModes),
|
|
ConsId = du_data_ctor(DuCtor),
|
|
get_cons_repn_defn(ModuleInfo, DuCtor, CtorRepn),
|
|
ConsTag = CtorRepn ^ cr_tag,
|
|
% Our optimization is inapplicable to constants, and its implementation
|
|
% in the code generator can handle only some kinds of functors with args.
|
|
% For example, it does not make sense to take the address of the field
|
|
% of a function symbol of a `notag' type. The only functors it can handle
|
|
% are the ones whose representation is remote_args_tag().
|
|
ConsTag = remote_args_tag(_),
|
|
% If the construction unification has any existential constraints,
|
|
% then ConstructArgVars will have more elements than the number of
|
|
% arguments in ConsRepn ^ cr_args (the extra variables will be the
|
|
% type_infos and/or typeclass_infos providing information about
|
|
% those constraints). This will cause all_delayed_arg_vars_are_full_words
|
|
% to fail.
|
|
%
|
|
% We could work around that fact, but existentially constrained
|
|
% construction unifications are so rare that there is no point.
|
|
all_delayed_arg_vars_are_full_words(ConstructArgVars, CtorRepn ^ cr_args,
|
|
DelayForVars),
|
|
require_det (
|
|
UnifyInputVars0 = !.UnifyInputVars,
|
|
bag.delete(ConstructedVar, !UnifyInputVars),
|
|
bag.insert_list(ConstructArgVars, !UnifyInputVars),
|
|
trace [compiletime(flag("lco")), io(!IO)] (
|
|
ProcInfo = ConstInfo ^ lci_cur_proc_proc,
|
|
proc_info_get_var_table(ProcInfo, ProcVarTable),
|
|
ConstructedVarStr = mercury_var_to_string(ProcVarTable,
|
|
print_name_and_num, ConstructedVar),
|
|
ConsIdStr = mercury_cons_id_to_string(output_debug,
|
|
does_not_need_brackets, ConsId),
|
|
ConstructArgVarStrs = list.map(
|
|
mercury_var_to_string(ProcVarTable, print_name_and_num),
|
|
ConstructArgVars),
|
|
ConstructArgVarsStr = string.join_list(", ", ConstructArgVarStrs),
|
|
get_debug_output_stream(ModuleInfo, DebugStream, !IO),
|
|
io.format(DebugStream,
|
|
"processing unification %s <= %s(%s)\n",
|
|
[s(ConstructedVarStr), s(ConsIdStr), s(ConstructArgVarsStr)],
|
|
!IO),
|
|
|
|
bag.to_assoc_list(UnifyInputVars0, InitialUnifyInputVars),
|
|
bag.to_assoc_list(!.UnifyInputVars, UpdatedUnifyInputVars),
|
|
io.write_string(DebugStream, "initial UnifyInputVars: ", !IO),
|
|
io.write_line(DebugStream, InitialUnifyInputVars, !IO),
|
|
io.write_string(DebugStream, "updated UnifyInputVars: ", !IO),
|
|
io.write_line(DebugStream, UpdatedUnifyInputVars, !IO)
|
|
)
|
|
).
|
|
|
|
:- pred all_delayed_arg_vars_are_full_words(list(prog_var)::in,
|
|
list(constructor_arg_repn)::in, set_of_progvar::in) is semidet.
|
|
|
|
all_delayed_arg_vars_are_full_words([], [], _).
|
|
all_delayed_arg_vars_are_full_words([ArgVar | ArgVars], [ArgRepn | ArgRepns],
|
|
DelayForVars) :-
|
|
ArgWidth = ArgRepn ^ car_pos_width,
|
|
(
|
|
ArgWidth = apw_full(_, _)
|
|
;
|
|
ArgWidth = apw_double(_, _, _),
|
|
% XXX I (zs) am not sure whether this works. Until I am,
|
|
% failing here plays things safe.
|
|
fail
|
|
;
|
|
( ArgWidth = apw_none_nowhere
|
|
; ArgWidth = apw_none_shifted(_, _)
|
|
),
|
|
% XXX We *could* allow lco to apply to fill in the values of
|
|
% dummy variables by passing a dummy pointer to some static
|
|
% variable we never read. However, it would be *far* simpler
|
|
% to just fill in the one possible value before the recursive call.
|
|
% XXX We don't do that yet either. Since code that fills in
|
|
% the value of a variable of a dummy type after recursive call
|
|
% is as rare as hen's teeth, this is not a great loss.
|
|
fail
|
|
;
|
|
( ArgWidth = apw_partial_first(_, _, _, _, _, _)
|
|
; ArgWidth = apw_partial_shifted(_, _, _, _, _, _)
|
|
),
|
|
% It is ok for the cell to have subword arguments (packed two or more
|
|
% into a single word) IF AND ONLY IF we don't try to take
|
|
% their addresses.
|
|
not set_of_var.member(DelayForVars, ArgVar)
|
|
),
|
|
all_delayed_arg_vars_are_full_words(ArgVars, ArgRepns, DelayForVars).
|
|
|
|
:- pred transform_call_and_unifies(hlds_goal::in, list(prog_var)::in,
|
|
list(hlds_goal)::in, bag(prog_var)::in, maybe(list(hlds_goal))::out,
|
|
lco_info::in, lco_info::out, lco_const_info::in) is det.
|
|
|
|
transform_call_and_unifies(CallGoal, CallOutArgVars, UnifyGoals,
|
|
UnifyInputVars, MaybeGoals, !Info, ConstInfo) :-
|
|
CallGoal = hlds_goal(CallGoalExpr, CallGoalInfo),
|
|
ModuleInfo = !.Info ^ lco_module_info,
|
|
CurProcInfo = ConstInfo ^ lci_cur_proc_proc,
|
|
( if
|
|
CallGoalExpr = plain_call(PredId, ProcId, ArgVars, Builtin,
|
|
UnifyContext, _SymName),
|
|
CurrProcOutArgs = ConstInfo ^ lci_cur_proc_outputs,
|
|
assoc_list.from_corresponding_lists(CallOutArgVars, CurrProcOutArgs,
|
|
CallHeadPairs),
|
|
find_args_to_pass_by_addr(ConstInfo, UnifyInputVars, CallHeadPairs,
|
|
1, Mismatches, UpdatedCallOutArgs, map.init, Subst, !Info),
|
|
trace [compiletime(flag("lco")), io(!IO)] (
|
|
get_debug_output_stream(ModuleInfo, DebugStream, !IO),
|
|
io.write_string(DebugStream, "find_args_to_pass_by_addr:\n", !IO),
|
|
io.write_string(DebugStream, "call head pairs: ", !IO),
|
|
io.write_line(DebugStream, CallHeadPairs, !IO),
|
|
io.write_string(DebugStream, "mismatches: ", !IO),
|
|
io.write_line(DebugStream, Mismatches, !IO),
|
|
io.write_string(DebugStream, "updated call out args: ", !IO),
|
|
io.write_line(DebugStream, UpdatedCallOutArgs, !IO),
|
|
io.write_string(DebugStream, "substitution: ", !IO),
|
|
map.to_assoc_list(Subst, SubstAL),
|
|
io.write_line(DebugStream, SubstAL, !IO),
|
|
io.nl(DebugStream, !IO)
|
|
),
|
|
% If there are no mismatches, we would create an identical "variant".
|
|
% Such cases should be optimized using other means.
|
|
Mismatches = [_ | _],
|
|
assoc_list.values(Mismatches, MismatchedCallArgs),
|
|
% The variants we create return each output in only one place in
|
|
% memory.
|
|
all_true(occurs_once(UnifyInputVars), MismatchedCallArgs),
|
|
|
|
list.map_foldl2(update_construct(ConstInfo, Subst),
|
|
UnifyGoals, UpdatedUnifyGoals, map.init, AddrFieldIds, !Info),
|
|
trace [compiletime(flag("lco")), io(!IO)] (
|
|
get_debug_output_stream(ModuleInfo, DebugStream, !IO),
|
|
VarTable = !.Info ^ lco_var_table,
|
|
VarNameSrc = vns_var_table(VarTable),
|
|
CurPredInfo = ConstInfo ^ lci_cur_proc_pred,
|
|
pred_info_get_typevarset(CurPredInfo, TVarSet),
|
|
proc_info_get_inst_varset(CurProcInfo, InstVarSet),
|
|
io.write_string(DebugStream, "original unifies:\n", !IO),
|
|
list.foldl(
|
|
dump_goal_nl(DebugStream, ModuleInfo, VarNameSrc,
|
|
TVarSet, InstVarSet),
|
|
UnifyGoals, !IO),
|
|
io.write_string(DebugStream, "updated unifies:\n", !IO),
|
|
list.foldl(
|
|
dump_goal_nl(DebugStream, ModuleInfo, VarNameSrc,
|
|
TVarSet, InstVarSet),
|
|
UpdatedUnifyGoals, !IO),
|
|
io.write_string(DebugStream, "addr field ids:\n", !IO),
|
|
map.to_assoc_list(AddrFieldIds, AddrFieldIdsAL),
|
|
io.write_line(DebugStream, AddrFieldIdsAL, !IO)
|
|
),
|
|
HighLevelData = ConstInfo ^ lci_highlevel_data,
|
|
make_variant_args(HighLevelData, AddrFieldIds, Mismatches,
|
|
VariantArgs),
|
|
ensure_variant_exists(PredId, ProcId, VariantArgs,
|
|
VariantPredProcId, VariantSymName, !Info)
|
|
then
|
|
proc_info_get_var_table(CurProcInfo, CurProcVarTable),
|
|
module_info_proc_info(ModuleInfo, PredId, ProcId, CalleeProcInfo),
|
|
proc_info_get_argmodes(CalleeProcInfo, CalleeModes),
|
|
update_call_args(ModuleInfo, CurProcVarTable, CalleeModes, ArgVars,
|
|
UpdatedCallOutArgs, UpdatedArgs),
|
|
VariantPredProcId = proc(VariantPredId, VariantProcId),
|
|
UpdatedGoalExpr = plain_call(VariantPredId, VariantProcId,
|
|
UpdatedArgs, Builtin, UnifyContext, VariantSymName),
|
|
OrigCallPurity = goal_info_get_purity(CallGoalInfo),
|
|
% If the original call was pure, then taking away its output
|
|
% allows the simplify pass to just delete it from the procedure.
|
|
% To prevent this, we mark the call as impure. However, we don't
|
|
% want this to make the whole procedure body impure, so we wrap
|
|
% a promise_purity scope around the pre-call unifications and the call
|
|
% that together do what the call and the post-call unifications
|
|
% originally did, and thus has the same purity. Since the unifications
|
|
% are always pure, this purity is the call's original purity.
|
|
goal_info_set_purity(purity_impure, CallGoalInfo, UpdatedGoalInfo),
|
|
UpdatedGoal = hlds_goal(UpdatedGoalExpr, UpdatedGoalInfo),
|
|
Goals = UpdatedUnifyGoals ++ [UpdatedGoal],
|
|
( if OrigCallPurity = purity_impure then
|
|
% The promise_purity scope would be redundant.
|
|
MaybeGoals = yes(Goals)
|
|
else
|
|
% Copying the nonlocals and instmap delta fields of ConjGoal and
|
|
% PromiseGoal from the corresponding fields of CallGoal is
|
|
% definitely wrong, since the conjunction binds the variables
|
|
% that in the original code were bound by the post-call
|
|
% unifications. We *could* cobble together the right values
|
|
% of both fields from the corresponding fields of CallGoal and
|
|
% UnifyGoals, but letting quantification and mode analysis do
|
|
% the job lets us avoid duplicating their here.
|
|
%
|
|
% The other fields of goal_infos are either ok to copy
|
|
% (such as determinism), or irrelevant (such as goal id).
|
|
% The most complex case is goal features. However, at the moment
|
|
% I (zs) believe that all the possible values of the goal_features
|
|
% type fall into one of four categories:
|
|
%
|
|
% - Those that are never attached to calls.
|
|
% - Those that are never attached to anything before the lco pass.
|
|
% - Those that are never looked at after the lco pass.
|
|
% - Those that are ok to copy to the conjunction and the scope.
|
|
%
|
|
% None need to be deleted from the conjunction or the scope.
|
|
ConjGoalExpr = conj(plain_conj, Goals),
|
|
ConjGoal = hlds_goal(ConjGoalExpr, UpdatedGoalInfo),
|
|
PromiseGoalExpr = scope(promise_purity(OrigCallPurity), ConjGoal),
|
|
PromiseGoal = hlds_goal(PromiseGoalExpr, UpdatedGoalInfo),
|
|
MaybeGoals = yes([PromiseGoal])
|
|
),
|
|
!Info ^ lco_changed := proc_changed
|
|
else
|
|
% The reversed conjunction does not follow the pattern we are looking
|
|
% for, so we cannot optimize it.
|
|
MaybeGoals = no
|
|
).
|
|
|
|
:- pred occurs_once(bag(prog_var)::in, prog_var::in) is semidet.
|
|
|
|
occurs_once(Bag, Var) :-
|
|
bag.count_value(Bag, Var, 1).
|
|
|
|
:- pred update_call_args(module_info::in, var_table::in, list(mer_mode)::in,
|
|
list(prog_var)::in, list(prog_var)::in, list(prog_var)::out) is det.
|
|
|
|
update_call_args(_ModuleInfo, _VarTable, [], [], UpdatedCallOutArgVars, []) :-
|
|
expect(unify(UpdatedCallOutArgVars, []), $pred,
|
|
"updating nonexistent arg").
|
|
update_call_args(_ModuleInfo, _VarTable, [], [_ | _], _, _) :-
|
|
unexpected($pred, "mismatched lists").
|
|
update_call_args(_ModuleInfo, _VarTable, [_ | _], [], _, _) :-
|
|
unexpected($pred, "mismatched lists").
|
|
update_call_args(ModuleInfo, VarTable, [CalleeMode | CalleeModes],
|
|
[ArgVar | ArgVars], !.UpdatedCallOutArgVars, !:UpdatedArgVars) :-
|
|
lookup_var_type(VarTable, ArgVar, CalleeType),
|
|
mode_to_top_functor_mode(ModuleInfo, CalleeMode, CalleeType,
|
|
TopFunctorMode),
|
|
(
|
|
TopFunctorMode = top_in,
|
|
update_call_args(ModuleInfo, VarTable, CalleeModes, ArgVars,
|
|
!.UpdatedCallOutArgVars, !:UpdatedArgVars),
|
|
!:UpdatedArgVars = [ArgVar | !.UpdatedArgVars]
|
|
;
|
|
TopFunctorMode = top_out,
|
|
(
|
|
!.UpdatedCallOutArgVars = [UpdatedArgVar | !:UpdatedCallOutArgVars]
|
|
;
|
|
!.UpdatedCallOutArgVars = [],
|
|
unexpected($pred, "no UpdatedCallOutArgs")
|
|
),
|
|
update_call_args(ModuleInfo, VarTable, CalleeModes, ArgVars,
|
|
!.UpdatedCallOutArgVars, !:UpdatedArgVars),
|
|
!:UpdatedArgVars = [UpdatedArgVar | !.UpdatedArgVars]
|
|
;
|
|
TopFunctorMode = top_unused,
|
|
unexpected($pred, "top_unused")
|
|
).
|
|
|
|
%---------------------------------------------------------------------------%
|
|
|
|
:- pred classify_proc_call_args(module_info::in, var_table::in,
|
|
list(prog_var)::in, list(mer_mode)::in,
|
|
list(prog_var)::out, list(prog_var)::out, list(prog_var)::out) is det.
|
|
|
|
classify_proc_call_args(_ModuleInfo, _VarTable, [], [], [], [], []).
|
|
classify_proc_call_args(_ModuleInfo, _VarTable, [], [_ | _], _, _, _) :-
|
|
unexpected($pred, "mismatched lists").
|
|
classify_proc_call_args(_ModuleInfo, _VarTable, [_ | _], [], _, _, _) :-
|
|
unexpected($pred, "mismatched lists").
|
|
classify_proc_call_args(ModuleInfo, VarTable, [Arg | Args],
|
|
[CalleeMode | CalleeModes], !:InArgs, !:OutArgs, !:UnusedArgs) :-
|
|
classify_proc_call_args(ModuleInfo, VarTable, Args, CalleeModes,
|
|
!:InArgs, !:OutArgs, !:UnusedArgs),
|
|
lookup_var_type(VarTable, Arg, CalleeType),
|
|
mode_to_top_functor_mode(ModuleInfo, CalleeMode, CalleeType,
|
|
TopFunctorMode),
|
|
(
|
|
TopFunctorMode = top_in,
|
|
!:InArgs = [Arg | !.InArgs]
|
|
;
|
|
TopFunctorMode = top_out,
|
|
!:OutArgs = [Arg | !.OutArgs]
|
|
;
|
|
TopFunctorMode = top_unused,
|
|
!:UnusedArgs = [Arg | !.UnusedArgs]
|
|
).
|
|
|
|
%---------------------------------------------------------------------------%
|
|
|
|
:- pred find_args_to_pass_by_addr(lco_const_info::in, bag(prog_var)::in,
|
|
assoc_list(prog_var, prog_var)::in, int::in,
|
|
assoc_list(int, prog_var)::out, list(prog_var)::out,
|
|
map(prog_var, prog_var)::in, map(prog_var, prog_var)::out,
|
|
lco_info::in, lco_info::out) is det.
|
|
|
|
find_args_to_pass_by_addr(_ConstInfo, _, [], _, [], [], !Subst, !Info).
|
|
find_args_to_pass_by_addr(ConstInfo, UnifyInputVars,
|
|
[CallArg - HeadArg | CallHeadArgs], ArgNum, Mismatches,
|
|
[UpdatedCallArg | UpdatedCallArgs], !Subst, !Info) :-
|
|
find_args_to_pass_by_addr(ConstInfo, UnifyInputVars, CallHeadArgs,
|
|
ArgNum + 1, MismatchesTail, UpdatedCallArgs, !Subst, !Info),
|
|
( if
|
|
ConstInfo ^ lci_allow_float_addr = do_not_allow_float_addr,
|
|
lookup_var_type(!.Info ^ lco_var_table, CallArg, CallArgType),
|
|
type_to_ctor(CallArgType, CallArgTypeCtor),
|
|
CallArgTypeCtor = type_ctor(unqualified("float"), 0)
|
|
then
|
|
!Info ^ lco_permitted := lco_is_not_permitted_on_scc
|
|
else
|
|
true
|
|
),
|
|
( if CallArg = HeadArg then
|
|
UpdatedCallArg = CallArg,
|
|
Mismatches = MismatchesTail,
|
|
( if bag.member(HeadArg, UnifyInputVars) then
|
|
% This is a fix for Mantis bug 103. If CallArg is both a head
|
|
% variable AND used in a unification that we are trying to move
|
|
% before the recursive call, like this:
|
|
%
|
|
% rec_call(..., HV2, X),
|
|
% HV3 = functor(HV2, X)
|
|
%
|
|
% then each call through this recursive call site is next to a
|
|
% unification that creates a cell with a field (in this case
|
|
% the first field) that needs to be set to the value of HV2
|
|
% finally computed by a base case. After the Nth recursive call,
|
|
% there will be N cells. There is no way we can pass N addresses
|
|
% to the base case without making the transformed code pass a
|
|
% LIST of addresses in place of HV2 in the argument list.
|
|
% That would be a different transformation than what lco.m does,
|
|
% and it is far from clear that that transformation would be a
|
|
% good idea, since it doubles the number of loop iterations
|
|
% we would need to execute (N recursive calls, and N iterations
|
|
% of a loop to fill in the fields).
|
|
%
|
|
% Instead, we just disable the application of the lco
|
|
% transformation to this call.
|
|
|
|
!Info ^ lco_permitted := lco_is_not_permitted_on_scc
|
|
else
|
|
true
|
|
)
|
|
else
|
|
make_address_var(ConstInfo, CallArg, UpdatedCallArg, !Info),
|
|
Mismatches = [ArgNum - CallArg | MismatchesTail],
|
|
map.det_insert(CallArg, UpdatedCallArg, !Subst)
|
|
).
|
|
|
|
:- pred make_address_var(lco_const_info::in, prog_var::in, prog_var::out,
|
|
lco_info::in, lco_info::out) is det.
|
|
|
|
make_address_var(ConstInfo, Var, AddrVar, !Info) :-
|
|
VarTable0 = !.Info ^ lco_var_table,
|
|
lookup_var_entry(VarTable0, Var, VarEntry),
|
|
Name = var_entry_name_default(Var, VarEntry, "SCCcallarg"),
|
|
VarEntry = vte(_, VarType, _VarTypeIsDummy),
|
|
HighLevelData = ConstInfo ^ lci_highlevel_data,
|
|
(
|
|
HighLevelData = no,
|
|
AddrVarType = make_ref_type(VarType)
|
|
;
|
|
HighLevelData = yes,
|
|
% We set the actual type later when it is more convenient.
|
|
AddrVarType = void_type
|
|
),
|
|
AddrName = "Addr" ++ Name,
|
|
AddrVarEntry = vte(AddrName, AddrVarType, is_not_dummy_type),
|
|
add_var_entry(AddrVarEntry, AddrVar, VarTable0, VarTable),
|
|
!Info ^ lco_var_table := VarTable.
|
|
|
|
:- func make_ref_type(mer_type) = mer_type.
|
|
|
|
make_ref_type(FieldType) = PtrType :-
|
|
RefTypeName = qualified(mercury_private_builtin_module,
|
|
"store_at_ref_type"),
|
|
PtrType = defined_type(RefTypeName, [FieldType], kind_star).
|
|
|
|
%---------------------------------------------------------------------------%
|
|
|
|
:- pred make_variant_args(bool::in, map(prog_var, field_id)::in,
|
|
assoc_list(int, prog_var)::in, list(variant_arg)::out) is det.
|
|
|
|
make_variant_args(HighLevelData, AddrVarFieldIds, Mismatches, VariantArgs) :-
|
|
(
|
|
HighLevelData = no,
|
|
MakeArg = (func(Pos - _Var) = variant_arg(Pos, no))
|
|
;
|
|
HighLevelData = yes,
|
|
MakeArg =
|
|
( func(Pos - Var) = variant_arg(Pos, yes(FieldId)) :-
|
|
map.lookup(AddrVarFieldIds, Var, FieldId)
|
|
)
|
|
),
|
|
VariantArgs = list.map(MakeArg, Mismatches).
|
|
|
|
:- pred ensure_variant_exists(pred_id::in, proc_id::in, list(variant_arg)::in,
|
|
pred_proc_id::out, sym_name::out, lco_info::in, lco_info::out) is semidet.
|
|
|
|
ensure_variant_exists(PredId, ProcId, AddrOutArgs, VariantPredProcId,
|
|
VariantSymName, !Info) :-
|
|
PredProcId = proc(PredId, ProcId),
|
|
CurSCCVariants0 = !.Info ^ lco_cur_scc_variants,
|
|
( if
|
|
multi_map.search(CurSCCVariants0, PredProcId, ExistingVariantIds),
|
|
match_existing_variant(ExistingVariantIds, AddrOutArgs,
|
|
ExistingVariantId)
|
|
then
|
|
ExistingVariantId = variant_id(_, VariantPredProcId, VariantSymName)
|
|
else
|
|
( if
|
|
multi_map.search(CurSCCVariants0, PredProcId, ExistingVariants)
|
|
then
|
|
VariantNumber = list.length(ExistingVariants) + 1
|
|
else
|
|
VariantNumber = 1
|
|
),
|
|
VariantNumber =< max_variants_per_proc,
|
|
|
|
ModuleInfo0 = !.Info ^ lco_module_info,
|
|
module_info_get_name(ModuleInfo0, ModuleName),
|
|
module_info_pred_info(ModuleInfo0, PredId, PredInfo),
|
|
PredOrFunc = pred_info_is_pred_or_func(PredInfo),
|
|
pred_info_get_name(PredInfo, PredName),
|
|
Transform = tn_last_call_modulo_cons(PredOrFunc, VariantNumber),
|
|
% Even if PredInfo describes a predicate opt-imported from another
|
|
% module, the variant we construct is defined in *this* module.
|
|
make_transformed_pred_name(PredName, Transform, VariantName),
|
|
|
|
some [!VariantPredInfo] (
|
|
!:VariantPredInfo = PredInfo,
|
|
VariantSymName = qualified(ModuleName, VariantName),
|
|
pred_info_set_module_name(ModuleName, !VariantPredInfo),
|
|
pred_info_set_name(VariantName, !VariantPredInfo),
|
|
pred_info_set_is_pred_or_func(pf_predicate, !VariantPredInfo),
|
|
|
|
pred_info_get_origin(PredInfo, Origin0),
|
|
AddrOutArgNums = list.map(va_pos, AddrOutArgs),
|
|
ProcTransform = proc_transform_lcmc(VariantNumber, AddrOutArgNums),
|
|
Origin = origin_proc_transform(ProcTransform, Origin0,
|
|
PredId, ProcId),
|
|
pred_info_set_origin(Origin, !VariantPredInfo),
|
|
|
|
% We throw away any other procs in the variant predicate, because
|
|
% we create a separate predicate for each variant.
|
|
%
|
|
% update_variant_pred_info will update the proc_info
|
|
% after transforming it.
|
|
pred_info_get_proc_table(PredInfo, ProcTable),
|
|
map.lookup(ProcTable, ProcId, ProcInfo),
|
|
VariantProcTable = map.singleton(ProcId, ProcInfo),
|
|
pred_info_set_proc_table(VariantProcTable, !VariantPredInfo),
|
|
|
|
module_info_get_predicate_table(ModuleInfo0, PredTable0),
|
|
predicate_table_insert(!.VariantPredInfo, VariantPredId,
|
|
PredTable0, PredTable),
|
|
module_info_set_predicate_table(PredTable,
|
|
ModuleInfo0, ModuleInfo)
|
|
),
|
|
|
|
VariantPredProcId = proc(VariantPredId, ProcId),
|
|
!Info ^ lco_module_info := ModuleInfo,
|
|
|
|
NewVariant =
|
|
variant_id(AddrOutArgs, VariantPredProcId, VariantSymName),
|
|
multi_map.set(PredProcId, NewVariant, CurSCCVariants0, CurSCCVariants),
|
|
!Info ^ lco_cur_scc_variants := CurSCCVariants
|
|
).
|
|
|
|
:- pred match_existing_variant(list(variant_id)::in, list(variant_arg)::in,
|
|
variant_id::out) is semidet.
|
|
|
|
match_existing_variant([VariantId0 | VariantIds], AddrArgNums, VariantId) :-
|
|
( if VariantId0 = variant_id(AddrArgNums, _, _) then
|
|
VariantId = VariantId0
|
|
else
|
|
match_existing_variant(VariantIds, AddrArgNums, VariantId)
|
|
).
|
|
|
|
:- func max_variants_per_proc = int.
|
|
|
|
max_variants_per_proc = 4.
|
|
|
|
%---------------------------------------------------------------------------%
|
|
|
|
:- pred update_construct(lco_const_info::in, map(prog_var, prog_var)::in,
|
|
hlds_goal::in, hlds_goal::out,
|
|
map(prog_var, field_id)::in, map(prog_var, field_id)::out,
|
|
lco_info::in, lco_info::out) is det.
|
|
|
|
update_construct(ConstInfo, Subst, Goal0, Goal, !AddrVarFieldIds, !Info) :-
|
|
Goal0 = hlds_goal(GoalExpr0, GoalInfo0),
|
|
( if
|
|
GoalExpr0 = unify(LHS, RHS0, Mode, Unification0, UnifyContext),
|
|
Unification0 = construct(Var, ConsId, ArgVars, ArgModes,
|
|
How, IsUnique, SubInfo0),
|
|
(
|
|
SubInfo0 = no_construct_sub_info,
|
|
TermSizeSlot = no
|
|
;
|
|
SubInfo0 = construct_sub_info(no, TermSizeSlot)
|
|
)
|
|
then
|
|
% For high-level data, we should not be using the `take_address_fields'
|
|
% feature in `construct_sub_info', but simply assign the new cell to
|
|
% each of the variables that takes its address. But as support for
|
|
% partial instantiation is incomplete, instmaps for the assignments are
|
|
% likely to be recomputed incorrectly.
|
|
HighLevelData = ConstInfo ^ lci_highlevel_data,
|
|
VarTable0 = !.Info ^ lco_var_table,
|
|
lookup_var_entry(VarTable0, Var, VarEntry),
|
|
VarEntry = vte(_, VarType, IsDummy),
|
|
InstMapDelta0 = goal_info_get_instmap_delta(GoalInfo0),
|
|
update_construct_args(Subst, HighLevelData, VarType, IsDummy,
|
|
ConsId, 1, ArgVars, UpdatedArgVars, AddrFields,
|
|
InstMapDelta0, InstMapDelta, !AddrVarFieldIds,
|
|
VarTable0, VarTable),
|
|
!Info ^ lco_var_table := VarTable,
|
|
(
|
|
AddrFields = [],
|
|
Goal = Goal0
|
|
;
|
|
AddrFields = [_ | _],
|
|
SubInfo = construct_sub_info(yes(AddrFields), TermSizeSlot),
|
|
Unification = construct(Var, ConsId, UpdatedArgVars, ArgModes,
|
|
How, IsUnique, SubInfo),
|
|
% We must update RHS because quantification gets the set of
|
|
% variables in the unification from there, not from Unification.
|
|
(
|
|
RHS0 = rhs_var(_),
|
|
unexpected($pred, "var RHS")
|
|
;
|
|
RHS0 = rhs_functor(RHSConsId, IsExistConstr, RHSVars0),
|
|
expect(unify(ConsId, RHSConsId), $pred, "cons_id mismatch"),
|
|
rename_var_list(need_not_rename, Subst, RHSVars0, RHSVars),
|
|
RHS = rhs_functor(RHSConsId, IsExistConstr, RHSVars)
|
|
;
|
|
RHS0 = rhs_lambda_goal(_, _, _, _, _, _, _),
|
|
unexpected($pred, "lambda RHS")
|
|
),
|
|
GoalExpr = unify(LHS, RHS, Mode, Unification, UnifyContext),
|
|
|
|
% For high-level data, there is a lie in this instmap_delta: the
|
|
% new cell is not yet ground, although it will become ground after
|
|
% the call that follows the construction.
|
|
goal_info_set_instmap_delta(InstMapDelta, GoalInfo0, GoalInfo),
|
|
Goal = hlds_goal(GoalExpr, GoalInfo)
|
|
)
|
|
else
|
|
unexpected($pred, "not construct")
|
|
).
|
|
|
|
:- pred update_construct_args(map(prog_var, prog_var)::in, bool::in,
|
|
mer_type::in, is_dummy_type::in, cons_id::in, int::in, list(prog_var)::in,
|
|
list(prog_var)::out, list(int)::out, instmap_delta::in, instmap_delta::out,
|
|
map(prog_var, field_id)::in, map(prog_var, field_id)::out,
|
|
var_table::in, var_table::out) is det.
|
|
|
|
update_construct_args(_, _, _, _, _, _, [], [], [],
|
|
!InstMapDelta, !AddrFieldIds, !VarTable).
|
|
update_construct_args(Subst, HighLevelData, VarType, IsDummyType,
|
|
ConsId, ArgNum, [OrigVar | OrigVars], [UpdatedVar | UpdatedVars],
|
|
AddrArgs, !InstMapDelta, !AddrFieldIds, !VarTable) :-
|
|
update_construct_args(Subst, HighLevelData, VarType, IsDummyType,
|
|
ConsId, ArgNum + 1, OrigVars, UpdatedVars, AddrArgsTail,
|
|
!InstMapDelta, !AddrFieldIds, !VarTable),
|
|
( if map.search(Subst, OrigVar, AddrVar) then
|
|
UpdatedVar = AddrVar,
|
|
(
|
|
HighLevelData = no,
|
|
FinalInst = ground_inst
|
|
;
|
|
HighLevelData = yes,
|
|
BoundFunctor = bound_functor_with_free_arg(ConsId, ArgNum),
|
|
FinalInst = bound(shared, inst_test_no_results, [BoundFunctor]),
|
|
% We didn't do this when we initially created the variable.
|
|
lookup_var_entry(!.VarTable, AddrVar, AddrVarEntry0),
|
|
AddrVarEntry0 = vte(AddrVarName, _, _),
|
|
% XXX Why is it that VarType, and its IsDummyType companion,
|
|
% do not depend on which field we are taking the address of?
|
|
AddrVarEntry = vte(AddrVarName, VarType, IsDummyType),
|
|
update_var_entry(AddrVar, AddrVarEntry, !VarTable)
|
|
),
|
|
instmap_delta_set_var(AddrVar, FinalInst, !InstMapDelta),
|
|
FieldId = field_id(VarType, ConsId, ArgNum),
|
|
map.det_insert(OrigVar, FieldId, !AddrFieldIds),
|
|
AddrArgs = [ArgNum | AddrArgsTail]
|
|
else
|
|
UpdatedVar = OrigVar,
|
|
AddrArgs = AddrArgsTail
|
|
).
|
|
|
|
:- func bound_functor_with_free_arg(cons_id, int) = bound_functor.
|
|
|
|
bound_functor_with_free_arg(ConsId, FreeArg) = Inst :-
|
|
Arity = cons_id_arity(ConsId),
|
|
list.duplicate(Arity, ground_inst, ArgInsts0),
|
|
list.det_replace_nth(ArgInsts0, FreeArg, free_inst, ArgInsts),
|
|
Inst = bound_functor(ConsId, ArgInsts).
|
|
|
|
%---------------------------------------------------------------------------%
|
|
|
|
:- pred acceptable_construct_modes(module_info::in, var_table::in,
|
|
list(prog_var)::in, list(unify_mode)::in) is semidet.
|
|
|
|
acceptable_construct_modes(_, _, [], []).
|
|
acceptable_construct_modes(_, _, [], [_ | _]) :-
|
|
unexpected($pred, "list length mismatch").
|
|
acceptable_construct_modes(_, _, [_ | _], []) :-
|
|
unexpected($pred, "list length mismatch").
|
|
acceptable_construct_modes(ModuleInfo, VarTable,
|
|
[Var | Vars], [UnifyMode | UnifyModes]) :-
|
|
lookup_var_type(VarTable, Var, Type),
|
|
UnifyMode = unify_modes_li_lf_ri_rf(InitInstX, FinalInstX,
|
|
InitInstY, FinalInstY),
|
|
inst_is_free(ModuleInfo, InitInstX),
|
|
inst_is_ground(ModuleInfo, Type, InitInstY),
|
|
inst_is_ground(ModuleInfo, Type, FinalInstX),
|
|
inst_is_ground(ModuleInfo, Type, FinalInstY),
|
|
acceptable_construct_modes(ModuleInfo, VarTable, Vars, UnifyModes).
|
|
|
|
%---------------------------------------------------------------------------%
|
|
|
|
:- pred store_updated_procs_in_module_info(pair(pred_proc_id, proc_info)::in,
|
|
module_info::in, module_info::out) is det.
|
|
|
|
store_updated_procs_in_module_info(PredProcId - NewProcInfo, !ModuleInfo) :-
|
|
PredProcId = proc(PredId, ProcId),
|
|
module_info_pred_info(!.ModuleInfo, PredId, PredInfo0),
|
|
pred_info_get_proc_table(PredInfo0, Procs0),
|
|
map.det_update(ProcId, NewProcInfo, Procs0, Procs),
|
|
pred_info_set_proc_table(Procs, PredInfo0, PredInfo),
|
|
module_info_set_pred_info(PredId, PredInfo, !ModuleInfo).
|
|
|
|
%---------------------------------------------------------------------------%
|
|
|
|
:- pred update_variant_pred_info(variant_map::in,
|
|
pair(pred_proc_id, variant_id)::in,
|
|
module_info::in, module_info::out) is det.
|
|
|
|
update_variant_pred_info(VariantMap, PredProcId - VariantId, !ModuleInfo) :-
|
|
trace [compiletime(flag("lco")), io(!IO)] (
|
|
get_debug_output_stream(!.ModuleInfo, DebugStream, !IO),
|
|
io.write_string(DebugStream, "\nupdate_variant_pred_info ", !IO),
|
|
io.write_line(DebugStream, PredProcId, !IO),
|
|
io.write_line(DebugStream, VariantId, !IO)
|
|
),
|
|
VariantId = variant_id(AddrOutArgs, VariantPredProcId, _VariantSymName),
|
|
VariantPredProcId = proc(VariantPredId, VariantProcId),
|
|
PredProcId = proc(PredId, ProcId),
|
|
|
|
module_info_pred_proc_info(!.ModuleInfo, PredId, ProcId,
|
|
PredInfo, ProcInfo),
|
|
lco_transform_variant_proc(VariantMap, AddrOutArgs, PredInfo, ProcInfo,
|
|
VariantProcInfo, !ModuleInfo),
|
|
|
|
proc_info_get_headvars(VariantProcInfo, HeadVars),
|
|
proc_info_get_var_table(VariantProcInfo, VarTable),
|
|
lookup_var_types(VarTable, HeadVars, ArgTypes),
|
|
|
|
some [!VariantPredInfo] (
|
|
module_info_pred_info(!.ModuleInfo, VariantPredId, !:VariantPredInfo),
|
|
% Put the updated arg type information in the VariantProcInfo
|
|
% we just constructed into !VariantPredInfo.
|
|
pred_info_get_arg_types(!.VariantPredInfo,
|
|
TVarSet, ExistQVars, _ArgTypes0),
|
|
pred_info_set_arg_types(TVarSet, ExistQVars, ArgTypes,
|
|
!VariantPredInfo),
|
|
% Put the VariantProcInfo we just constructed into !VariantPredInfo.
|
|
VariantProcs = map.singleton(VariantProcId, VariantProcInfo),
|
|
pred_info_set_proc_table(VariantProcs, !VariantPredInfo),
|
|
module_info_set_pred_info(VariantPredId, !.VariantPredInfo,
|
|
!ModuleInfo)
|
|
).
|
|
|
|
%---------------------------------------------------------------------------%
|
|
|
|
:- pred lco_transform_variant_proc(variant_map::in, list(variant_arg)::in,
|
|
pred_info::in, proc_info::in, proc_info::out,
|
|
module_info::in, module_info::out) is det.
|
|
|
|
lco_transform_variant_proc(VariantMap, AddrOutArgs, PredInfo, ProcInfo,
|
|
!:VariantProcInfo, !ModuleInfo) :-
|
|
!:VariantProcInfo = ProcInfo,
|
|
proc_info_get_var_table(ProcInfo, VarTable0),
|
|
proc_info_get_headvars(ProcInfo, HeadVars0),
|
|
proc_info_get_argmodes(ProcInfo, ArgModes0),
|
|
make_addr_vars(!.ModuleInfo, 1, HeadVars0, HeadVars, ArgModes0, ArgModes,
|
|
AddrOutArgs, VarToAddr, VarTable0, VarTable),
|
|
proc_info_set_headvars(HeadVars, !VariantProcInfo),
|
|
proc_info_set_argmodes(ArgModes, !VariantProcInfo),
|
|
proc_info_set_var_table(VarTable, !VariantProcInfo),
|
|
|
|
proc_info_get_initial_instmap(!.ModuleInfo, ProcInfo, InstMap0),
|
|
proc_info_get_goal(ProcInfo, Goal0),
|
|
lco_transform_variant_goal(!.ModuleInfo,
|
|
groundings_and_lco_calls(set_of_var.init), VariantMap,
|
|
VarToAddr, InstMap0, Goal0, Goal, Changed, !VariantProcInfo),
|
|
trace [compiletime(flag("lco")), io(!IO)] (
|
|
get_debug_output_stream(!.ModuleInfo, DebugStream, !IO),
|
|
io.write_string(DebugStream, "\nlco_transform_variant_proc\n", !IO),
|
|
(
|
|
Changed = no,
|
|
io.write_string(DebugStream, "unchanged\n", !IO)
|
|
;
|
|
Changed = yes,
|
|
io.write_string(DebugStream, "goal before:\n", !IO),
|
|
pred_info_get_typevarset(PredInfo, TVarSet),
|
|
proc_info_get_inst_varset(!.VariantProcInfo, InstVarSet),
|
|
dump_goal_nl(DebugStream, !.ModuleInfo, vns_var_table(VarTable),
|
|
TVarSet, InstVarSet, Goal0, !IO),
|
|
io.write_string(DebugStream, "\ngoal after:\n", !IO),
|
|
dump_goal_nl(DebugStream, !.ModuleInfo, vns_var_table(VarTable),
|
|
TVarSet, InstVarSet, Goal, !IO)
|
|
)
|
|
),
|
|
proc_info_set_goal(Goal, !VariantProcInfo),
|
|
% We changed the scopes of the headvars we now return via pointers.
|
|
requantify_proc_general(ord_nl_no_lambda, !VariantProcInfo),
|
|
|
|
% The high-level data transformation requires instmap deltas
|
|
% to be recomputed.
|
|
module_info_get_globals(!.ModuleInfo, Globals),
|
|
globals.get_target(Globals, Target),
|
|
(
|
|
Target = target_c
|
|
;
|
|
( Target = target_java
|
|
; Target = target_csharp
|
|
),
|
|
recompute_instmap_delta_proc(no_recomp_atomics,
|
|
!VariantProcInfo, !ModuleInfo)
|
|
).
|
|
|
|
:- pred make_addr_vars(module_info::in, int::in,
|
|
list(prog_var)::in, list(prog_var)::out,
|
|
list(mer_mode)::in, list(mer_mode)::out,
|
|
list(variant_arg)::in, var_to_target::out,
|
|
var_table::in, var_table::out) is det.
|
|
|
|
make_addr_vars(_, _, [], [], [], [], AddrOutArgs, [], !VarTable) :-
|
|
expect(unify(AddrOutArgs, []), $pred, "AddrOutArgs != []").
|
|
make_addr_vars(_, _, [], _, [_ | _], _, _, _, !VarTable) :-
|
|
unexpected($pred, "mismatched lists").
|
|
make_addr_vars(_, _, [_ | _], _, [], _, _, _, !VarTable) :-
|
|
unexpected($pred, "mismatched lists").
|
|
make_addr_vars(ModuleInfo, NextOutArgNum,
|
|
[HeadVar0 | HeadVars0], [HeadVar | HeadVars],
|
|
[Mode0 | Modes0], [Mode | Modes],
|
|
!.AddrOutArgs, VarToAddr, !VarTable) :-
|
|
lookup_var_entry(!.VarTable, HeadVar0, HeadVarEntry0),
|
|
HeadVarType = HeadVarEntry0 ^ vte_type,
|
|
mode_to_top_functor_mode(ModuleInfo, Mode0, HeadVarType, TopFunctorMode),
|
|
(
|
|
TopFunctorMode = top_in,
|
|
HeadVar = HeadVar0,
|
|
Mode = Mode0,
|
|
make_addr_vars(ModuleInfo, NextOutArgNum,
|
|
HeadVars0, HeadVars, Modes0, Modes,
|
|
!.AddrOutArgs, VarToAddr, !VarTable)
|
|
;
|
|
TopFunctorMode = top_out,
|
|
( if
|
|
!.AddrOutArgs = [AddrOutArg | !:AddrOutArgs],
|
|
AddrOutArg = variant_arg(NextOutArgNum, MaybeFieldId)
|
|
then
|
|
HeadVarName = var_entry_name(HeadVar0, HeadVarEntry0),
|
|
AddrVarName = "AddrOf" ++ HeadVarName,
|
|
(
|
|
MaybeFieldId = no,
|
|
% For low-level data we replace the output argument with a
|
|
% store_at_ref_type(T) input argument.
|
|
AddrVarType = make_ref_type(HeadVarType),
|
|
AddrVarTypeIsDummy = is_not_dummy_type,
|
|
Mode = in_mode
|
|
;
|
|
MaybeFieldId = yes(field_id(AddrVarType, ConsId, ArgNum)),
|
|
% For high-level data we replace the output argument with a
|
|
% partially instantiated structure. The structure has one
|
|
% argument left unfilled.
|
|
AddrVarTypeIsDummy = is_type_a_dummy(ModuleInfo, AddrVarType),
|
|
BoundFunctor = bound_functor_with_free_arg(ConsId, ArgNum),
|
|
InitialInst =
|
|
bound(shared, inst_test_no_results, [BoundFunctor]),
|
|
Mode = from_to_mode(InitialInst, ground_inst)
|
|
),
|
|
AddrVarEntry = vte(AddrVarName, AddrVarType, AddrVarTypeIsDummy),
|
|
add_var_entry(AddrVarEntry, AddrVar, !VarTable),
|
|
HeadVar = AddrVar,
|
|
make_addr_vars(ModuleInfo, NextOutArgNum + 1,
|
|
HeadVars0, HeadVars, Modes0, Modes,
|
|
!.AddrOutArgs, VarToAddrTail, !VarTable),
|
|
VarToAddrHead = HeadVar0 - store_target(AddrVar, MaybeFieldId),
|
|
VarToAddr = [VarToAddrHead | VarToAddrTail]
|
|
else
|
|
HeadVar = HeadVar0,
|
|
Mode = Mode0,
|
|
make_addr_vars(ModuleInfo, NextOutArgNum + 1,
|
|
HeadVars0, HeadVars, Modes0, Modes,
|
|
!.AddrOutArgs, VarToAddr, !VarTable)
|
|
)
|
|
;
|
|
TopFunctorMode = top_unused,
|
|
unexpected($pred, "top_unused")
|
|
).
|
|
|
|
% The lco_transform_variant_* predicates can perform two transformations.
|
|
%
|
|
% The first transformation is done by lco_transform_variant_atomic_goal.
|
|
% It takes atomic goals that ground one or more of the output arguments
|
|
% of the current procedure that we are supposed to return not by the usual
|
|
% route, but by filling in a memory cell whose address we are given.
|
|
% We have to perform this transformation whereever it is applicable
|
|
% in the body of the procedure.
|
|
%
|
|
% The second transformation is done by lco_transform_variant_plain_call.
|
|
% It checks whether the callee of a plain call goal has an lco-optimized
|
|
% variant that is applicable to the call site, and if yes, calls that
|
|
% variant instead of the original predicate. In the usual case where
|
|
% the callee is recursive, this is basically a short-circuiting operation:
|
|
% instead of calling first (say) p, which then calls lco-optimized-p
|
|
% which then calls itself, we call lco-optimized-p directly. The main
|
|
% benefit here is that the short-circuited code has a smaller footprint
|
|
% in the instruction cache, and will thus probably get fewer misses there.
|
|
%
|
|
% However, the second transformation replaces code that would record
|
|
% the value of the lco-optimized output variables of the callee in the
|
|
% current procedure's stack frame with code that puts the values of those
|
|
% variables in fields in heap cells. Any attempt by later code to look up
|
|
% the values of these variables would thus result in a compiler crash
|
|
% in the code generator (Mantis bug #539). We can therefore apply this
|
|
% tranformation (named lco_calls in this type) ONLY if the affected
|
|
% variables are NOT needed by later code. The argument of the second
|
|
% function symbol here gives the set of variables whose values *are*
|
|
% needed by later code.
|
|
%
|
|
:- type variant_transforms
|
|
---> groundings_only
|
|
; groundings_and_lco_calls(set_of_progvar).
|
|
|
|
:- pred lco_transform_variant_goal(module_info::in, variant_transforms::in,
|
|
variant_map::in, var_to_target::in, instmap::in,
|
|
hlds_goal::in, hlds_goal::out, bool::out,
|
|
proc_info::in, proc_info::out) is det.
|
|
|
|
lco_transform_variant_goal(ModuleInfo, Transforms, VariantMap, VarToAddr,
|
|
InstMap0, Goal0, Goal, Changed, !ProcInfo) :-
|
|
Goal0 = hlds_goal(GoalExpr0, GoalInfo0),
|
|
(
|
|
GoalExpr0 = conj(ConjType, Goals0),
|
|
(
|
|
ConjType = plain_conj,
|
|
% We want to process the conjuncts of the conjunction backwards,
|
|
% from last conjunct to first conjunct, so that when we process
|
|
% a conjunct, we know what variables the conjuncts to its right
|
|
% need as inputs. (This info is needed for the fix of Mantis
|
|
% bug #539.)
|
|
%
|
|
% However, processing each goal requires its initial instmap,
|
|
% and we can apply instmaps only from front to back. So we get
|
|
% rev_conj_and_attach_init_instmaps to record the initial instmap
|
|
% of each conjunct with that conjunct, and at the same time
|
|
% reverse the list. We then give this reversed, instmap-annotated
|
|
% list to lco_transform_variant_rev_conj.
|
|
rev_conj_and_attach_init_instmaps(InstMap0, Goals0,
|
|
[], RevGoalIMs0),
|
|
lco_transform_variant_rev_conj(ModuleInfo, Transforms, VariantMap,
|
|
VarToAddr, RevGoalIMs0, cord.init, GoalsCord, Changed,
|
|
!ProcInfo),
|
|
GoalExpr = conj(ConjType, cord.list(GoalsCord)),
|
|
GoalInfo = GoalInfo0
|
|
;
|
|
ConjType = parallel_conj,
|
|
unexpected($pred, "parallel_conj")
|
|
)
|
|
;
|
|
GoalExpr0 = disj(Goals0),
|
|
list.map2_foldl(
|
|
lco_transform_variant_goal(ModuleInfo, Transforms, VariantMap,
|
|
VarToAddr, InstMap0),
|
|
Goals0, Goals, DisjsChanged, !ProcInfo),
|
|
Changed = bool.or_list(DisjsChanged),
|
|
GoalExpr = disj(Goals),
|
|
GoalInfo = GoalInfo0
|
|
;
|
|
GoalExpr0 = switch(Var, CanFail, Cases0),
|
|
list.map2_foldl(
|
|
lco_transform_variant_case(ModuleInfo, Transforms, VariantMap,
|
|
VarToAddr, InstMap0),
|
|
Cases0, Cases, CasesChanged, !ProcInfo),
|
|
Changed = bool.or_list(CasesChanged),
|
|
GoalExpr = switch(Var, CanFail, Cases),
|
|
GoalInfo = GoalInfo0
|
|
;
|
|
GoalExpr0 = if_then_else(Vars, Cond, Then0, Else0),
|
|
apply_goal_instmap_delta(Cond, InstMap0, InstMap1),
|
|
lco_transform_variant_goal(ModuleInfo, Transforms, VariantMap,
|
|
VarToAddr, InstMap1, Then0, Then, ThenChanged, !ProcInfo),
|
|
lco_transform_variant_goal(ModuleInfo, Transforms, VariantMap,
|
|
VarToAddr, InstMap0, Else0, Else, ElseChanged, !ProcInfo),
|
|
Changed = bool.or(ThenChanged, ElseChanged),
|
|
GoalExpr = if_then_else(Vars, Cond, Then, Else),
|
|
GoalInfo = GoalInfo0
|
|
;
|
|
GoalExpr0 = scope(Reason, SubGoal0),
|
|
( if
|
|
Reason = from_ground_term(FGTVar, FGT),
|
|
( FGT = from_ground_term_construct
|
|
; FGT = from_ground_term_deconstruct
|
|
)
|
|
then
|
|
( if
|
|
list.member(FGTVarPair, VarToAddr),
|
|
FGTVarPair = FGTVar - _
|
|
then
|
|
% We can treat such a scope as an atomic goal, since all we
|
|
% care about is with either is that it makes the variable
|
|
% we're interested in ground.
|
|
lco_transform_variant_atomic_goal(ModuleInfo, VarToAddr,
|
|
InstMap0, GoalInfo0, GoalExpr0, GoalExpr, Changed,
|
|
!ProcInfo)
|
|
else
|
|
GoalExpr = GoalExpr0,
|
|
Changed = no
|
|
)
|
|
else
|
|
lco_transform_variant_goal(ModuleInfo, Transforms, VariantMap,
|
|
VarToAddr, InstMap0, SubGoal0, SubGoal, Changed, !ProcInfo),
|
|
GoalExpr = scope(Reason, SubGoal)
|
|
),
|
|
GoalInfo = GoalInfo0
|
|
;
|
|
GoalExpr0 = negation(_),
|
|
GoalExpr = GoalExpr0,
|
|
GoalInfo = GoalInfo0,
|
|
Changed = no
|
|
;
|
|
GoalExpr0 = generic_call(_, _, _, _, _),
|
|
lco_transform_variant_atomic_goal(ModuleInfo, VarToAddr,
|
|
InstMap0, GoalInfo0, GoalExpr0, GoalExpr, Changed, !ProcInfo),
|
|
GoalInfo = GoalInfo0
|
|
;
|
|
GoalExpr0 = plain_call(_, _, _, _, _, _),
|
|
lco_transform_variant_plain_call(ModuleInfo, Transforms, VariantMap,
|
|
VarToAddr, InstMap0, GoalExpr0, GoalExpr,
|
|
GoalInfo0, GoalInfo, Changed, !ProcInfo)
|
|
;
|
|
GoalExpr0 = unify(_, _, _, _, _),
|
|
lco_transform_variant_atomic_goal(ModuleInfo, VarToAddr,
|
|
InstMap0, GoalInfo0, GoalExpr0, GoalExpr, Changed, !ProcInfo),
|
|
GoalInfo = GoalInfo0
|
|
;
|
|
GoalExpr0 = call_foreign_proc(_, _, _, _, _, _, _),
|
|
lco_transform_variant_atomic_goal(ModuleInfo, VarToAddr,
|
|
InstMap0, GoalInfo0, GoalExpr0, GoalExpr, Changed, !ProcInfo),
|
|
GoalInfo = GoalInfo0
|
|
;
|
|
GoalExpr0 = shorthand(_),
|
|
% These should have been expanded out by now.
|
|
unexpected($pred, "shorthand")
|
|
),
|
|
(
|
|
Changed = yes,
|
|
% This is not actually necessary for the transformation used for
|
|
% high-level data.
|
|
goal_info_set_purity(purity_impure, GoalInfo, GoalInfoImpure),
|
|
Goal = hlds_goal(GoalExpr, GoalInfoImpure)
|
|
;
|
|
Changed = no,
|
|
Goal = Goal0
|
|
).
|
|
|
|
:- type goal_and_init_instmap
|
|
---> goal_and_init_instmap(hlds_goal, instmap).
|
|
|
|
:- pred rev_conj_and_attach_init_instmaps(instmap::in, list(hlds_goal)::in,
|
|
list(goal_and_init_instmap)::in, list(goal_and_init_instmap)::out) is det.
|
|
|
|
rev_conj_and_attach_init_instmaps(_, [], !RevGoalIMs).
|
|
rev_conj_and_attach_init_instmaps(InstMap0, [Goal | Goals], !RevGoalIMs) :-
|
|
GoalIM = goal_and_init_instmap(Goal, InstMap0),
|
|
!:RevGoalIMs = [GoalIM | !.RevGoalIMs],
|
|
apply_goal_instmap_delta(Goal, InstMap0, InstMap1),
|
|
rev_conj_and_attach_init_instmaps(InstMap1, Goals, !RevGoalIMs).
|
|
|
|
:- pred lco_transform_variant_rev_conj(module_info::in, variant_transforms::in,
|
|
variant_map::in, var_to_target::in,
|
|
list(goal_and_init_instmap)::in, cord(hlds_goal)::in, cord(hlds_goal)::out,
|
|
bool::out, proc_info::in, proc_info::out) is det.
|
|
|
|
lco_transform_variant_rev_conj(_, _, _, _, [], !Conjuncts, no, !ProcInfo).
|
|
lco_transform_variant_rev_conj(ModuleInfo, Transforms0, VariantMap, VarToAddr,
|
|
[RevGoalIM0 | RevGoalIMs0], !Conjuncts, Changed, !ProcInfo) :-
|
|
RevGoalIM0 = goal_and_init_instmap(RevGoal0, RevGoalInitInstMap),
|
|
lco_transform_variant_goal(ModuleInfo, Transforms0, VariantMap, VarToAddr,
|
|
RevGoalInitInstMap, RevGoal0, RevGoal, HeadChanged, !ProcInfo),
|
|
RevGoal = hlds_goal(RevGoalExpr, RevGoalInfo),
|
|
(
|
|
Transforms0 = groundings_only,
|
|
Transforms1 = groundings_only
|
|
;
|
|
Transforms0 = groundings_and_lco_calls(NeededLaterVars0),
|
|
% XXX The value of Transforms starts out as groundings_and_lco_calls,
|
|
% and this is the only logical place where it could transition to
|
|
% groundings_only. We could e.g. switch to groundings_only
|
|
% when we encounter nonrecursive calls in our backward traversal.
|
|
%
|
|
% However, if we did that, then lco_transform_variant_plain_call's
|
|
% handling of groundings_and_lco_calls would not get tested
|
|
% when compiling tests/valid/bug539.m. Also, not switching
|
|
% to groundings_only here should yield very slightly faster code,
|
|
% as explained in the comment on the variant_transforms type.
|
|
get_input_vars_needed_by_goal(RevGoalInitInstMap, RevGoalInfo,
|
|
NeededVars),
|
|
set_of_var.union(NeededVars, NeededLaterVars0, NeededLaterVars1),
|
|
Transforms1 = groundings_and_lco_calls(NeededLaterVars1)
|
|
),
|
|
lco_transform_variant_rev_conj(ModuleInfo, Transforms1, VariantMap,
|
|
VarToAddr, RevGoalIMs0, !Conjuncts, TailChanged, !ProcInfo),
|
|
Changed = bool.or(HeadChanged, TailChanged),
|
|
( if RevGoalExpr = conj(plain_conj, RevGoalSubConjuncts) then
|
|
cord.snoc_list(RevGoalSubConjuncts, !Conjuncts)
|
|
else
|
|
cord.snoc(RevGoal, !Conjuncts)
|
|
).
|
|
|
|
:- pred get_input_vars_needed_by_goal(instmap::in, hlds_goal_info::in,
|
|
set_of_progvar::out) is det.
|
|
|
|
get_input_vars_needed_by_goal(InstMap0, GoalInfo, NeededVars) :-
|
|
% A goal may need the value of a variable from preceding code if
|
|
% - the variable already has an inst before the goal, and
|
|
% - the goal actually refers to the variable.
|
|
%
|
|
% Technically, we want only the vars in InstMap0 whose inst is more
|
|
% instantiated than just "free". However, the vast majority of variables
|
|
% are bound by their first occurrence, so they already more instantiated
|
|
% than "free" when they are first put into an instmap. We can afford
|
|
% to be too-conservative with the remainder. (Including variables
|
|
% in InstMapVars even when they are free errs on the side of caution.)
|
|
instmap_vars(InstMap0, InstMapVars),
|
|
NonLocals = goal_info_get_nonlocals(GoalInfo),
|
|
NeededVars = set_of_var.intersect(InstMapVars, NonLocals).
|
|
|
|
:- pred lco_transform_variant_case(module_info::in, variant_transforms::in,
|
|
variant_map::in, var_to_target::in, instmap::in,
|
|
case::in, case::out, bool::out, proc_info::in, proc_info::out) is det.
|
|
|
|
lco_transform_variant_case(ModuleInfo, Transforms, VariantMap, VarToAddr,
|
|
InstMap0, Case0, Case, Changed, !ProcInfo) :-
|
|
Case0 = case(MainConsId, OtherConsIds, Goal0),
|
|
lco_transform_variant_goal(ModuleInfo, Transforms, VariantMap, VarToAddr,
|
|
InstMap0, Goal0, Goal, Changed, !ProcInfo),
|
|
Case = case(MainConsId, OtherConsIds, Goal).
|
|
|
|
:- pred lco_transform_variant_plain_call(module_info::in,
|
|
variant_transforms::in, variant_map::in, var_to_target::in, instmap::in,
|
|
hlds_goal_expr::in(goal_expr_plain_call), hlds_goal_expr::out,
|
|
hlds_goal_info::in, hlds_goal_info::out, bool::out,
|
|
proc_info::in, proc_info::out) is det.
|
|
|
|
lco_transform_variant_plain_call(ModuleInfo, Transforms, VariantMap, VarToAddr,
|
|
InstMap0, GoalExpr0, GoalExpr, GoalInfo0, GoalInfo, Changed,
|
|
!ProcInfo) :-
|
|
apply_goal_info_instmap_delta(GoalInfo0, InstMap0, InstMap1),
|
|
proc_info_get_var_table(!.ProcInfo, VarTable),
|
|
list.filter(is_grounding(ModuleInfo, VarTable, InstMap0, InstMap1),
|
|
VarToAddr, GroundingVarToAddr),
|
|
(
|
|
GroundingVarToAddr = [],
|
|
GoalExpr = GoalExpr0,
|
|
GoalInfo = GoalInfo0,
|
|
Changed = no
|
|
;
|
|
GroundingVarToAddr = [_ | _],
|
|
% Check if there is a variant of the called procedure where we can pass
|
|
% an address variable in place of each variable that would be ground by
|
|
% the call.
|
|
GoalExpr0 = plain_call(CallPredId, CallProcId, ArgVars, Builtin,
|
|
UnifyContext, _SymName),
|
|
CallPredProcId = proc(CallPredId, CallProcId),
|
|
module_info_proc_info(ModuleInfo, CallPredId, CallProcId,
|
|
CalleeProcInfo),
|
|
proc_info_get_argmodes(CalleeProcInfo, CalleeArgModes),
|
|
( if
|
|
multi_map.search(VariantMap, CallPredProcId, ExistingVariantIds),
|
|
classify_proc_call_args(ModuleInfo, VarTable,
|
|
ArgVars, CalleeArgModes,
|
|
_InArgVars, OutArgVars, _UnusedArgVars),
|
|
grounding_to_variant_args(GroundingVarToAddr, 1, OutArgVars, Subst,
|
|
VariantArgVars, VariantArgs),
|
|
match_existing_variant(ExistingVariantIds, VariantArgs,
|
|
ExistingVariantId),
|
|
|
|
% The need for the test done by the rest of this condition
|
|
% is explained by the comment on the variant_transforms type.
|
|
Transforms = groundings_and_lco_calls(NeededVarsSet),
|
|
set_of_var.list_to_set(VariantArgVars, VariantArgVarSet),
|
|
set_of_var.intersect(NeededVarsSet, VariantArgVarSet,
|
|
NeededOutArgVarsSet),
|
|
set_of_var.is_empty(NeededOutArgVarsSet)
|
|
then
|
|
rename_var_list(need_not_rename, Subst, ArgVars, CallArgVars),
|
|
ExistingVariantId = variant_id(_, VariantPredProcId,
|
|
VariantSymName),
|
|
VariantPredProcId = proc(VariantPredId, VariantProcId),
|
|
GoalExpr = plain_call(VariantPredId, VariantProcId, CallArgVars,
|
|
Builtin, UnifyContext, VariantSymName),
|
|
|
|
module_info_get_globals(ModuleInfo, Globals),
|
|
globals.get_target(Globals, Target),
|
|
(
|
|
Target = target_c,
|
|
GoalInfo = GoalInfo0
|
|
;
|
|
( Target = target_java
|
|
; Target = target_csharp
|
|
),
|
|
% The partially instantiated cells will be ground
|
|
% after the call.
|
|
list.map(pair.fst, GroundingVarToAddr, GroundVars),
|
|
map.apply_to_list(GroundVars, Subst, AddrVars),
|
|
InstMapDelta0 = goal_info_get_instmap_delta(GoalInfo0),
|
|
instmap_delta_set_vars_same(ground_inst, AddrVars,
|
|
InstMapDelta0, InstMapDelta),
|
|
goal_info_set_instmap_delta(InstMapDelta, GoalInfo0, GoalInfo)
|
|
),
|
|
Changed = yes
|
|
else
|
|
lco_transform_variant_atomic_goal(ModuleInfo, VarToAddr, InstMap0,
|
|
GoalInfo0, GoalExpr0, GoalExpr, Changed, !ProcInfo),
|
|
GoalInfo = GoalInfo0
|
|
)
|
|
).
|
|
|
|
:- pred lco_transform_variant_atomic_goal(module_info::in, var_to_target::in,
|
|
instmap::in, hlds_goal_info::in, hlds_goal_expr::in, hlds_goal_expr::out,
|
|
bool::out, proc_info::in, proc_info::out) is det.
|
|
|
|
lco_transform_variant_atomic_goal(ModuleInfo, VarToAddr, InstMap0,
|
|
GoalInfo, GoalExpr0, GoalExpr, Changed, !ProcInfo) :-
|
|
apply_goal_info_instmap_delta(GoalInfo, InstMap0, InstMap1),
|
|
proc_info_get_var_table(!.ProcInfo, VarTable),
|
|
list.filter(is_grounding(ModuleInfo, VarTable, InstMap0, InstMap1),
|
|
VarToAddr, GroundingVarToAddr),
|
|
(
|
|
GroundingVarToAddr = [],
|
|
GoalExpr = GoalExpr0,
|
|
Changed = no
|
|
;
|
|
GroundingVarToAddr = [_ | _],
|
|
list.map_foldl(make_store_goal(ModuleInfo, InstMap1),
|
|
GroundingVarToAddr, StoreGoals, !ProcInfo),
|
|
GoalExpr = conj(plain_conj,
|
|
[hlds_goal(GoalExpr0, GoalInfo) | StoreGoals]),
|
|
Changed = yes
|
|
).
|
|
|
|
:- pred grounding_to_variant_args(assoc_list(prog_var, store_target)::in,
|
|
int::in, list(prog_var)::in, prog_var_renaming::out,
|
|
list(prog_var)::out, list(variant_arg)::out) is det.
|
|
|
|
grounding_to_variant_args(GroundingVarToAddr, OutArgNum, OutArgVars, Subst,
|
|
VariantArgVars, VariantArgs) :-
|
|
(
|
|
OutArgVars = [],
|
|
Subst = map.init,
|
|
VariantArgVars = [],
|
|
VariantArgs = []
|
|
;
|
|
OutArgVars = [OutArgVar | OutArgVarsTail],
|
|
grounding_to_variant_args(GroundingVarToAddr, OutArgNum + 1,
|
|
OutArgVarsTail, Subst0, VariantArgVarsTail, VariantArgsTail),
|
|
( if assoc_list.search(GroundingVarToAddr, OutArgVar, StoreTarget) then
|
|
StoreTarget = store_target(StoreArgVar, MaybeFieldId),
|
|
map.det_insert(OutArgVar, StoreArgVar, Subst0, Subst),
|
|
VariantArg = variant_arg(OutArgNum, MaybeFieldId),
|
|
VariantArgVars = [OutArgVar | VariantArgVarsTail],
|
|
VariantArgs = [VariantArg | VariantArgsTail]
|
|
else
|
|
Subst = Subst0,
|
|
VariantArgVars = VariantArgVarsTail,
|
|
VariantArgs = VariantArgsTail
|
|
)
|
|
).
|
|
|
|
:- pred make_store_goal(module_info::in, instmap::in,
|
|
pair(prog_var, store_target)::in, hlds_goal::out,
|
|
proc_info::in, proc_info::out) is det.
|
|
|
|
make_store_goal(ModuleInfo, InstMap, GroundVar - StoreTarget, Goal,
|
|
!ProcInfo) :-
|
|
StoreTarget = store_target(AddrVar, MaybeFieldId),
|
|
(
|
|
% Low-level data.
|
|
MaybeFieldId = no,
|
|
generate_plain_call(ModuleInfo, pf_predicate,
|
|
mercury_private_builtin_module, "store_at_ref_impure",
|
|
[], [AddrVar, GroundVar], instmap_delta_bind_vars([]), only_mode,
|
|
detism_det, purity_impure, [], dummy_context, Goal)
|
|
;
|
|
% High-level data.
|
|
MaybeFieldId = yes(field_id(AddrVarType, ConsId, ArgNum)),
|
|
get_cons_id_arg_types(ModuleInfo, AddrVarType, ConsId, ArgTypes),
|
|
make_unification_args(ModuleInfo, GroundVar, ArgNum, 1, ArgTypes,
|
|
ArgVars, ArgModes, !ProcInfo),
|
|
|
|
RHS = rhs_functor(ConsId, is_not_exist_constr, ArgVars),
|
|
|
|
instmap_lookup_var(InstMap, AddrVar, AddrVarInst0),
|
|
inst_expand(ModuleInfo, AddrVarInst0, AddrVarInst),
|
|
UnifyMode = unify_modes_li_lf_ri_rf(AddrVarInst, ground_inst,
|
|
ground_inst, ground_inst),
|
|
|
|
Unification = deconstruct(AddrVar, ConsId, ArgVars, ArgModes,
|
|
cannot_fail, cannot_cgc),
|
|
UnifyContext = unify_context(umc_implicit("lcmc"), []),
|
|
|
|
GoalExpr = unify(AddrVar, RHS, UnifyMode, Unification, UnifyContext),
|
|
|
|
goal_info_init(GoalInfo0),
|
|
goal_info_set_determinism(detism_det, GoalInfo0, GoalInfo1),
|
|
goal_info_set_instmap_delta(instmap_delta_bind_var(AddrVar),
|
|
GoalInfo1, GoalInfo),
|
|
|
|
Goal = hlds_goal(GoalExpr, GoalInfo)
|
|
).
|
|
|
|
:- pred make_unification_args(module_info::in, prog_var::in, int::in, int::in,
|
|
list(mer_type)::in, list(prog_var)::out, list(unify_mode)::out,
|
|
proc_info::in, proc_info::out) is det.
|
|
|
|
make_unification_args(ModuleInfo, GroundVar, TargetArgNum, CurArgNum, ArgTypes,
|
|
ArgVars, ArgModes, !ProcInfo) :-
|
|
(
|
|
ArgTypes = [],
|
|
ArgVars = [],
|
|
ArgModes = []
|
|
;
|
|
ArgTypes = [ArgType | ArgTypesTail],
|
|
make_unification_args(ModuleInfo, GroundVar, TargetArgNum,
|
|
CurArgNum + 1, ArgTypesTail, ArgVarsTail, ArgModesTail, !ProcInfo),
|
|
make_unification_arg(ModuleInfo, GroundVar, TargetArgNum,
|
|
CurArgNum, ArgType, Var, ArgMode, !ProcInfo),
|
|
ArgVars = [Var | ArgVarsTail],
|
|
ArgModes = [ArgMode | ArgModesTail]
|
|
).
|
|
|
|
:- pred make_unification_arg(module_info::in, prog_var::in, int::in, int::in,
|
|
mer_type::in, prog_var::out, unify_mode::out,
|
|
proc_info::in, proc_info::out) is det.
|
|
|
|
make_unification_arg(ModuleInfo, GroundVar, TargetArgNum, CurArgNum,
|
|
ArgType, Var, UnifyMode, !ProcInfo) :-
|
|
( if CurArgNum = TargetArgNum then
|
|
Var = GroundVar,
|
|
UnifyMode = unify_modes_li_lf_ri_rf(free_inst, ground_inst,
|
|
ground_inst, ground_inst)
|
|
else
|
|
% Bind other arguments to fresh variables.
|
|
ArgTypeIsDummy = is_type_a_dummy(ModuleInfo, ArgType),
|
|
proc_info_create_var_from_type("", ArgType, ArgTypeIsDummy,
|
|
Var, !ProcInfo),
|
|
UnifyMode = unify_modes_li_lf_ri_rf(ground_inst, ground_inst,
|
|
free_inst, ground_inst)
|
|
).
|
|
|
|
%---------------------------------------------------------------------------%
|
|
|
|
:- pred is_grounding(module_info::in, var_table::in, instmap::in, instmap::in,
|
|
pair(prog_var, store_target)::in) is semidet.
|
|
|
|
is_grounding(ModuleInfo, VarTable, InstMap0, InstMap, Var - _StoreTarget) :-
|
|
lookup_var_type(VarTable, Var, Type),
|
|
instmap_lookup_var(InstMap0, Var, Inst0),
|
|
not inst_is_ground(ModuleInfo, Type, Inst0),
|
|
instmap_is_reachable(InstMap),
|
|
instmap_lookup_var(InstMap, Var, Inst),
|
|
inst_is_ground(ModuleInfo, Type, Inst).
|
|
|
|
%---------------------------------------------------------------------------%
|
|
|
|
:- pred get_lco_debug_output_stream(lco_info::in, io.text_output_stream::out,
|
|
io::di, io::uo) is det.
|
|
|
|
get_lco_debug_output_stream(Info, DebugStream, !IO) :-
|
|
ModuleInfo = Info ^ lco_module_info,
|
|
get_debug_output_stream(ModuleInfo, DebugStream, !IO).
|
|
|
|
%---------------------------------------------------------------------------%
|
|
:- end_module transform_hlds.lco.
|
|
%---------------------------------------------------------------------------%
|