open! Core_kernel

(** [S_gen] is the type of the module returned by [Incr_map.Make]. It is a specialization
    of the interface of [Incr_map], with:

    - the ['w] state_witness type parameter removed
    - the [Incremental.State.t] argument removed

    The comments for components of [S_gen] are in [module type Incr_map] below. *)
module type S_gen = sig
  module Incr : sig
    type 'a t

    module Cutoff : sig
      type 'a t
    end
  end

  val of_set : ('k, 'cmp) Set.t Incr.t -> ('k, unit, 'cmp) Map.t Incr.t

  val filter_mapi
    :  ?data_equal:('v1 -> 'v1 -> bool)
    -> ('k, 'v1, 'cmp) Map.t Incr.t
    -> f:(key:'k -> data:'v1 -> 'v2 option)
    -> ('k, 'v2, 'cmp) Map.t Incr.t

  val mapi
    :  ?data_equal:('v1 -> 'v1 -> bool)
    -> ('k, 'v1, 'cmp) Map.t Incr.t
    -> f:(key:'k -> data:'v1 -> 'v2)
    -> ('k, 'v2, 'cmp) Map.t Incr.t

  val filter_mapi'
    :  ?cutoff:'v1 Incr.Cutoff.t
    -> ?data_equal:('v1 -> 'v1 -> bool)
    -> ('k, 'v1, 'cmp) Map.t Incr.t
    -> f:(key:'k -> data:'v1 Incr.t -> 'v2 option Incr.t)
    -> ('k, 'v2, 'cmp) Map.t Incr.t

  val mapi'
    :  ?cutoff:'v1 Incr.Cutoff.t
    -> ?data_equal:('v1 -> 'v1 -> bool)
    -> ('k, 'v1, 'cmp) Map.t Incr.t
    -> f:(key:'k -> data:'v1 Incr.t -> 'v2 Incr.t)
    -> ('k, 'v2, 'cmp) Map.t Incr.t

  val unordered_fold
    :  ?data_equal:('v -> 'v -> bool)
    -> ?update:(key:'k -> old_data:'v -> new_data:'v -> 'acc -> 'acc)
    -> ?specialized_initial:(init:'acc -> ('k, 'v, 'cmp) Map.t -> 'acc)
    -> ('k, 'v, 'cmp) Map.t Incr.t
    -> init:'acc
    -> add:(key:'k -> data:'v -> 'acc -> 'acc)
    -> remove:(key:'k -> data:'v -> 'acc -> 'acc)
    -> 'acc Incr.t

  val merge
    :  ?data_equal_left:('v1 -> 'v1 -> bool)
    -> ?data_equal_right:('v2 -> 'v2 -> bool)
    -> ('k, 'v1, 'cmp) Map.t Incr.t
    -> ('k, 'v2, 'cmp) Map.t Incr.t
    -> f:(key:'k -> [ `Left of 'v1 | `Right of 'v2 | `Both of 'v1 * 'v2 ] -> 'v3 option)
    -> ('k, 'v3, 'cmp) Map.t Incr.t

  val flatten : ('k, 'v Incr.t, 'cmp) Map.t -> ('k, 'v, 'cmp) Map.t Incr.t
  val join : ('k, 'v Incr.t, 'cmp) Map.t Incr.t -> ('k, 'v, 'cmp) Map.t Incr.t

  val separate
    :  ('k, 'v, 'cmp) Map.t Incr.t
    -> data_equal:('v -> 'v -> bool)
    -> ('k, 'v Incr.t, 'cmp) Map.t Incr.t

  val keys : ('k, 'v, 'c) Map.t Incr.t -> ('k, 'c) Set.t Incr.t

  val subrange
    :  ?data_equal:('v -> 'v -> bool)
    -> ('k, 'v, 'cmp) Map.t Incr.t
    -> ('k Maybe_bound.As_lower_bound.t * 'k Maybe_bound.As_upper_bound.t) option Incr.t
    -> ('k, 'v, 'cmp) Map.t Incr.t

  val subrange_by_rank
    :  ?data_equal:('v -> 'v -> bool)
    -> ('k, 'v, 'cmp) Map.t Incr.t
    -> (int Maybe_bound.As_lower_bound.t * int Maybe_bound.As_upper_bound.t) Incr.t
    -> ('k, 'v, 'cmp) Map.t Incr.t

  val index_by
    :  ('inner_key, 'v, 'inner_cmp) Map.t Incr.t
    -> comparator:('outer_key, 'outer_cmp) Map.comparator
    -> index:('v -> 'outer_key option)
    -> ('outer_key, ('inner_key, 'v, 'inner_cmp) Map.t, 'outer_cmp) Map.t Incr.t

  val unordered_fold_nested_maps
    :  ?data_equal:('v -> 'v -> bool)
    -> ?update:
         (outer_key:'outer_key
          -> inner_key:'inner_key
          -> old_data:'v
          -> new_data:'v
          -> 'acc
          -> 'acc)
    -> ('outer_key, ('inner_key, 'v, 'inner_cmp) Map.t, 'outer_cmp) Map.t Incr.t
    -> init:'acc
    -> add:(outer_key:'outer_key -> inner_key:'inner_key -> data:'v -> 'acc -> 'acc)
    -> remove:(outer_key:'outer_key -> inner_key:'inner_key -> data:'v -> 'acc -> 'acc)
    -> 'acc Incr.t

  val transpose
    :  ?data_equal:('v -> 'v -> bool)
    -> ('k2, 'k2_cmp) Map.comparator
    -> ('k1, ('k2, 'v, 'k2_cmp) Map.t, 'k1_cmp) Map.t Incr.t
    -> ('k2, ('k1, 'v, 'k1_cmp) Map.t, 'k2_cmp) Map.t Incr.t

  module Lookup : sig
    type ('k, 'v, 'cmp) t

    val create
      :  ?data_equal:('v -> 'v -> bool)
      -> ('k, 'v, 'cmp) Map.t Incr.t
      -> comparator:('k, 'cmp) Comparator.t
      -> ('k, 'v, 'cmp) t

    val find : ('k, 'v, _) t -> 'k -> 'v option Incr.t

    module M (K : sig
        type t
        type comparator_witness
      end) : sig
      type nonrec 'v t = (K.t, 'v, K.comparator_witness) t
    end

    module For_debug : sig
      val sexp_of_t : ('k -> Sexp.t) -> ('v -> Sexp.t) -> ('k, 'v, 'cmp) t -> Sexp.t
    end
  end

  module For_testing : sig
    val find_key_range_linear
      :  from:int
      -> to_:int
      -> ('a, 'b, 'c) Base.Map.t
      -> ('a * 'a option) option
  end
end

module type Incr_map = sig
  (** Functions for using maps efficiently within Incremental. The goal of the algorithms
here is to do work on the output of the computation proportional to the amount of
work done on the input. i.e., [k] modifications to the input map for some
computation will result in [k] modifications to the output map. The changes to the
input map are typically computed using [Map.symmetric_diff].
Unless stated otherwise, the non-incremental semantics of these functions (i.e.,
ignoring performance) is the same as the corresponding function in Core_kernel's
[Map] module. *)

  (** Per its type, turns an incremental set into an incremental map over the same key
      type and comparator, whose data is [unit]. *)
  val of_set
    : (('k, 'cmp) Set.t, 'w) Incremental.t -> (('k, unit, 'cmp) Map.t, 'w) Incremental.t

  (** Incremental counterpart of the [Map] function of the same name: [f] is given each
      key and its data, and bindings for which it returns [None] are absent from the
      result. NOTE(review): [data_equal] presumably decides whether a key's data has
      changed between stabilizations; confirm against the implementation. *)
  val filter_mapi
    :  ?data_equal:('v1 -> 'v1 -> bool)
    -> (('k, 'v1, 'cmp) Map.t, 'w) Incremental.t
    -> f:(key:'k -> data:'v1 -> 'v2 option)
    -> (('k, 'v2, 'cmp) Map.t, 'w) Incremental.t

  (** Incremental counterpart of the [Map] function of the same name. *)
  val mapi
    :  ?data_equal:('v1 -> 'v1 -> bool)
    -> (('k, 'v1, 'cmp) Map.t, 'w) Incremental.t
    -> f:(key:'k -> data:'v1 -> 'v2)
    -> (('k, 'v2, 'cmp) Map.t, 'w) Incremental.t

  (** Variant of [filter_mapi] in which [f] receives each key's data as an incremental and
      returns an incremental result. NOTE(review): [cutoff] is presumably applied to the
      per-key data incrementals handed to [f]; confirm against the implementation. *)
  val filter_mapi'
    :  ?cutoff:'v1 Incremental.Cutoff.t
    -> ?data_equal:('v1 -> 'v1 -> bool)
    -> (('k, 'v1, 'cmp) Map.t, 'w) Incremental.t
    -> f:(key:'k -> data:('v1, 'w) Incremental.t -> ('v2 option, 'w) Incremental.t)
    -> (('k, 'v2, 'cmp) Map.t, 'w) Incremental.t

  (** Variant of [mapi] in which [f] receives each key's data as an incremental and
      returns an incremental result. The optional arguments mirror those of the
      incremental variant of [filter_mapi]. *)
  val mapi'
    :  ?cutoff:'v1 Incremental.Cutoff.t
    -> ?data_equal:('v1 -> 'v1 -> bool)
    -> (('k, 'v1, 'cmp) Map.t, 'w) Incremental.t
    -> f:(key:'k -> data:('v1, 'w) Incremental.t -> ('v2, 'w) Incremental.t)
    -> (('k, 'v2, 'cmp) Map.t, 'w) Incremental.t

  (** [unordered_fold i ~init ~add ~remove] constructs a more incremental version of:
{[
let%map m = i in
Map.fold m ~init ~f:add
]}
assuming that [remove] is the inverse of [add], and that the operations for
different keys can be performed in any order. Note that [data_equal] defaults
to [phys_equal], but a more precise equality can be provided instead.
When the data for a key updates, by default [remove] is called on the old data
and then [add] is called on the new data.
[update] provides an alternative single function to call each time a key's data
updates, and can be used to improve efficiency.
For the initial computation, by default [add] is called on all the elements in the
map. As this can be inefficient, [specialized_initial] can be provided to perform
the computation in a more effective way.
*)
  val unordered_fold
    :  ?data_equal:('v -> 'v -> bool)
    -> ?update:(key:'k -> old_data:'v -> new_data:'v -> 'acc -> 'acc)
    -> ?specialized_initial:(init:'acc -> ('k, 'v, 'cmp) Map.t -> 'acc)
    -> (('k, 'v, 'cmp) Map.t, 'w) Incremental.t
    -> init:'acc
    -> add:(key:'k -> data:'v -> 'acc -> 'acc)
    -> remove:(key:'k -> data:'v -> 'acc -> 'acc)
    -> ('acc, 'w) Incremental.t

  (** Like [merge] in [Base.Map.merge]. Note that [f] is called at most once per key in
any given stabilization. *)
  val merge
    :  ?data_equal_left:('v1 -> 'v1 -> bool)
    -> ?data_equal_right:('v2 -> 'v2 -> bool)
    -> (('k, 'v1, 'cmp) Map.t, 'w) Incremental.t
    -> (('k, 'v2, 'cmp) Map.t, 'w) Incremental.t
    -> f:(key:'k -> [ `Left of 'v1 | `Right of 'v2 | `Both of 'v1 * 'v2 ] -> 'v3 option)
    -> (('k, 'v3, 'cmp) Map.t, 'w) Incremental.t

  (** This is the "easy" version of [join]: the input map is a plain (non-incremental)
      value and only its data are incremental. Unlike the other functions here it takes
      the [Incremental.State.t] explicitly. *)
  val flatten
    :  'w Incremental.State.t
    -> ('k, ('v, 'w) Incremental.t, 'cmp) Map.t
    -> (('k, 'v, 'cmp) Map.t, 'w) Incremental.t

  (** The non-incremental semantics of this function is the identity function. Its
purpose is to collapse the extra level of incrementality at the level of the data of
the map. *)
  val join
    :  (('k, ('v, 'w) Incremental.t, 'cmp) Map.t, 'w) Incremental.t
    -> (('k, 'v, 'cmp) Map.t, 'w) Incremental.t

  (** Judging by its type, the counterpart of [join]: it turns an incremental map of plain
      data into an incremental map whose data are themselves incrementals.
      NOTE(review): [data_equal] is required here, presumably to decide when a key's
      incremental needs updating; confirm against the implementation. *)
  val separate
    :  (('k, 'v, 'cmp) Map.t, 'w) Incremental.t
    -> data_equal:('v -> 'v -> bool)
    -> (('k, ('v, 'w) Incremental.t, 'cmp) Map.t, 'w) Incremental.t

  (** The keys of the input map, as an incremental set using the same comparator
      witness. *)
  val keys : (('k, 'v, 'c) Map.t, 'w) Incremental.t -> (('k, 'c) Set.t, 'w) Incremental.t

  (** [subrange map (min, max)] constructs an incremental submap that includes all of the
keys and data from [map] between [min] and [max], and none of the keys outside the
range.
[subrange map None] is the empty map. [range] being [None] means no elements are
chosen.
Note that incremental changes have a runtime of O((k + m) log n) where k is the size
of the changes to the underlying map and m is the size of the changes to the
elements contained by the range. The complexity of the initial computation is the
same as the incremental computation, with some simplification. k = 0 because we have
not made any changes to the underlying map yet, and m equals the size of the range,
because the initial range is empty. *)
  val subrange
    :  ?data_equal:('v -> 'v -> bool)
    -> (('k, 'v, 'cmp) Map.t, 'w) Incremental.t
    -> (('k Maybe_bound.As_lower_bound.t * 'k Maybe_bound.As_upper_bound.t) option, 'w)
         Incremental.t
    -> (('k, 'v, 'cmp) Map.t, 'w) Incremental.t

  (** [subrange_by_rank map (s, e)] constructs an incremental submap that includes (e-s+1)
keys between s-th and e-th, inclusive.
If s is greater than or equal to the map length, the result is empty.
If e is greater than or equal to the map length, the result contains keys from s-th to the
last one.
Raises for invalid indices - s < 0 or e < s.
Runtime of the initial computation is O(min(e, n-s) + log(n)), i.e. linear,
but optimized for ranges close to beginning or end.
Runtime of the incremental computation is O(log(n) + k + (m+m') * log(n)) where:
- k is the size of the diff
- m is the total impact of map changes on the range, bounded by k (e.g. if we add
1001 keys and remove 1000 below s, then m = 1)
- m' = O( |new s - old s| + |new e - old e| ).
*)
  val subrange_by_rank
    :  ?data_equal:('v -> 'v -> bool)
    -> (('k, 'v, 'cmp) Map.t, 'w) Incremental.t
    -> (int Maybe_bound.As_lower_bound.t * int Maybe_bound.As_upper_bound.t, 'w)
         Incremental.t
    -> (('k, 'v, 'cmp) Map.t, 'w) Incremental.t

  (** [index_by map ~comparator ~index] constructs an incremental map-of-maps where each
key-data pair of the input map is present in one (or none) of the inner maps.
[index] specifies the outer map key under which each original key-data pair is
found.
All of the resulting inner maps are guaranteed to be non-empty.
An all-at-once version of [index_by] would look like:
{[
let index_by map ~comparator ~index =
Map.to_alist map
|> List.filter_map ~f:(fun (key, data) ->
match index data with
| None -> None
| Some index -> Some (index, (key, data)))
|> Map.of_alist_multi comparator
|> Map.map ~f:(Map.of_alist_exn (Map.comparator_s map))
;;
]} *)
  val index_by
    :  (('inner_key, 'v, 'inner_cmp) Map.t, 'w) Incremental.t
    -> comparator:('outer_key, 'outer_cmp) Map.comparator
    -> index:('v -> 'outer_key option)
    -> ( ('outer_key, ('inner_key, 'v, 'inner_cmp) Map.t, 'outer_cmp) Map.t
       , 'w )
         Incremental.t

  (** Counterpart of [unordered_fold] for a map of maps: [add], [remove] and the optional
      [update] receive both the outer and the inner key of the affected binding.
      NOTE(review): the same assumptions as for [unordered_fold] ([remove] inverts [add],
      order-independence) presumably apply; confirm against the implementation. *)
  val unordered_fold_nested_maps
    :  ?data_equal:('v -> 'v -> bool)
    -> ?update:
         (outer_key:'outer_key
          -> inner_key:'inner_key
          -> old_data:'v
          -> new_data:'v
          -> 'acc
          -> 'acc)
    -> (('outer_key, ('inner_key, 'v, 'inner_cmp) Map.t, 'outer_cmp) Map.t, 'w)
         Incremental.t
    -> init:'acc
    -> add:(outer_key:'outer_key -> inner_key:'inner_key -> data:'v -> 'acc -> 'acc)
    -> remove:(outer_key:'outer_key -> inner_key:'inner_key -> data:'v -> 'acc -> 'acc)
    -> ('acc, 'w) Incremental.t

  (** Per its type, swaps the nesting of a map of maps: the input is keyed by ['k1] then
      ['k2], the result by ['k2] then ['k1]. The comparator argument is the one for the
      new outer key type ['k2]. *)
  val transpose
    :  ?data_equal:('v -> 'v -> bool)
    -> ('k2, 'k2_cmp) Map.comparator
    -> (('k1, ('k2, 'v, 'k2_cmp) Map.t, 'k1_cmp) Map.t, 'w) Incremental.t
    -> (('k2, ('k1, 'v, 'k1_cmp) Map.t, 'k2_cmp) Map.t, 'w) Incremental.t

  (** [('k, 'v) Lookup.t] provides a way to lookup keys in a map which uses symmetric
diffs to trigger updates of the lookups.
The complexity of an update depends on:
- [n]: the number of keys in the larger of the old/updated input map
- [k]: the number of lookup nodes created using [find]
- [m]: the number of elements in the symdiff of the maps
- [symdiff(n)]: the cost of performing the symdiff on the map (m <= symdiff(n) <= n)
Each update should cost [O(symdiff(n) + m * log k)], so this will be efficient when
there are a lot of lookups (close to n) into a map which can be efficiently
symdiffed (and therefore has a small number of changes also). The cost of updating
when performing the same lookups by means of [Incr.map ~f:(fun m -> Map.find m key)]
is [O(k * log n)].
*)
  module Lookup : sig
    type ('k, 'v, 'cmp, 'w) t

    (** Create the lookup structure on an incremental map. *)
    val create
      :  ?data_equal:('v -> 'v -> bool)
      -> (('k, 'v, 'cmp) Map.t, 'w) Incremental.t
      -> comparator:('k, 'cmp) Comparator.t
      -> ('k, 'v, 'cmp, 'w) t

    (** Create a node which performs [Map.find] on the input map.

        [find (create incr_map) key] should be equivalent to [Incr.map ~f:(fun m ->
        Map.find m key) incr_map], but when you call [find] many times for a single
        [create] the nodes should update more efficiently in stabilisation when [incr_map]
        changes in a way which can be efficiently diffed.

        This will re-use existing nodes when it can, but will not always do so.
    *)
    val find : ('k, 'v, _, 'w) t -> 'k -> ('v option, 'w) Incremental.t

    (** A convenient way to refer to the type for a given key. *)
    module M (K : sig
        type t
        type comparator_witness
      end) : sig
      type nonrec ('v, 'w) t = (K.t, 'v, K.comparator_witness, 'w) t
    end

    (** Sexp rendering of a lookup structure, intended for debugging only. *)
    module For_debug : sig
      val sexp_of_t : ('k -> Sexp.t) -> ('v -> Sexp.t) -> ('k, 'v, 'cmp, _) t -> Sexp.t
    end
  end

  (** Exposed for tests only. *)
  module For_testing : sig
    val find_key_range_linear
      :  from:int
      -> to_:int
      -> ('a, 'b, 'c) Base.Map.t
      -> ('a * 'a option) option
  end

  module type S_gen = S_gen

  (** [S_gen] with its [Incr], [Incr.Cutoff] and [Lookup] types tied to [Incremental] at a
      single, fixed [state_witness]. *)
  module type S = sig
    type state_witness

    include
      S_gen
      with type 'a Incr.t = ('a, state_witness) Incremental.t
       and type 'a Incr.Cutoff.t = 'a Incremental.Cutoff.t
       and type ('k, 'v, 'cmp) Lookup.t = ('k, 'v, 'cmp, state_witness) Lookup.t
  end

  (** Specializes this interface to a given [Incremental.S] instance; [state_witness] and
      [Incr] in the result are substituted with those of the argument. *)
  module Make (Incr : Incremental.S) :
    S with type state_witness := Incr.state_witness and module Incr := Incr
end