(* Source: obj_array.ml (u.e8154ba896059bfe0f59281181c41fac.base.v0.16.4.doc.src.base) *)

open! Import
module Int = Int0
module String = String0
module Array = Array0

(* We maintain the property that all values of type [t] do not have the tag
   [double_array_tag]. Some functions below assume this in order to avoid testing the
   tag, and will segfault if this property doesn't hold. *)
type t = Stdlib.Obj.t array

(* [invariant t] asserts the property above: the block backing [t] must not carry
   [double_array_tag]. *)
let invariant t =
  assert (Stdlib.Obj.tag (Stdlib.Obj.repr t) <> Stdlib.Obj.double_array_tag)
;;

(* [length t] is the number of slots in [t]. *)
let length = Array.length

(* would check for float arrays in 32 bit, but whatever *)
(* [sexp_of_t t] is deliberately opaque: it renders only the length of [t], never its
   elements. *)
let sexp_of_t t =
  Sexp.Atom
    (String.concat ~sep:"" [ "<Obj_array.t of length "; Int.to_string (length t); ">" ])
;;

(* The immediate integer 0 viewed as an [Obj.t]; used as the filler for fresh arrays. *)
let zero_obj = Stdlib.Obj.repr (0 : int)

(* We call [Array.create] with a value that is not a float so that the array doesn't get
   tagged with [Double_array_tag]. *)
let create_zero ~len = Array.create ~len zero_obj

(* The zero-length array. *)
let empty = [||]

(* Element type used only as the target of the casts below. It has one constant
   constructor and one constructor carrying an argument; presumably this is so that the
   compiler treats elements as values that may be either immediate or boxed, but never
   floats (see the comment in [get]) -- NOTE(review): confirm the rationale. *)
type not_a_float =
  | Not_a_float_0
  | Not_a_float_1 of int

(* Each constructor is built once here; presumably this is only to keep the constructors
   from being reported as unused -- NOTE(review): confirm. *)
let _not_a_float_0 = Not_a_float_0
let _not_a_float_1 = Not_a_float_1 42

(* [get t i] reads slot [i] of [t] through the checked [.(i)] indexing operator ([set]
   below relies on [get] having validated [i]). *)
let get t i =
  (* Make the compiler believe [t] is an array not containing floats so it does not check
     if [t] is tagged with [Double_array_tag]. It is NOT ok to use [int array] since (if
     this function is inlined and the array contains in-heap boxed values) wrong register
     typing may result, leading to a failure to register necessary GC roots. *)
  Stdlib.Obj.repr
    (* [Sys.opaque_identity] is required on the array because this code breaks the usual
       assumptions about array kinds that the Flambda 2 optimiser can see. *)
    ((Sys.opaque_identity (Stdlib.Obj.magic (t : t) : not_a_float array)).(i)
      : not_a_float)
;;

(* [unsafe_get t i] is [get t i] implemented with [Array.unsafe_get]; the caller is
   responsible for [i] being a valid index. *)
let[@inline always] unsafe_get t i =
  (* Make the compiler believe [t] is an array not containing floats so it does not check
     if [t] is tagged with [Double_array_tag]. *)
  Stdlib.Obj.repr
    (Array.unsafe_get
       (Sys.opaque_identity (Obj_local.magic (t : t) : not_a_float array))
       i
      : not_a_float)
;;

(* [unsafe_set_with_caml_modify t i obj] stores [obj] in slot [i] with
   [Array.unsafe_set] on a [not_a_float array] view of [t]. No old-value inspection and
   no physical-equality shortcut is performed here. *)
let[@inline always] unsafe_set_with_caml_modify t i obj =
  (* Same comment as [unsafe_get]. Sys.opaque_identity prevents the compiler from
     potentially wrongly guessing the type of the array based on the type of element, that
     is prevent the implication: (Obj.tag obj = Obj.double_tag) => (Obj.tag t =
     Obj.double_array_tag) which flambda has tried in the past (at least that's assuming
     the compiler respects Sys.opaque_identity, which is not always the case). *)
  Array.unsafe_set
    (Sys.opaque_identity (Obj_local.magic (t : t) : not_a_float array))
    i
    (Stdlib.Obj.obj (Sys.opaque_identity obj) : not_a_float)
;;

(* [set_with_caml_modify t i obj] is the variant of [unsafe_set_with_caml_modify] that
   goes through the checked [.(i) <-] operator. *)
let[@inline always] set_with_caml_modify t i obj =
  (* same as unsafe_set_with_caml_modify but safe *)
  (Sys.opaque_identity (Stdlib.Obj.magic (t : t) : not_a_float array)).(i)
  <- (Stdlib.Obj.obj (Sys.opaque_identity obj) : not_a_float)
;;

(* [unsafe_set_int_assuming_currently_int t i int] stores the integer [int] in slot [i]
   through an [int array] view of [t]. Pre-condition: slot [i] currently holds an
   integer. *)
let[@inline always] unsafe_set_int_assuming_currently_int t i int =
  (* This skips [caml_modify], which is OK if both the old and new values are integers. *)
  Array.unsafe_set
    (Sys.opaque_identity (Obj_local.magic (t : t) : int array))
    i
    (Sys.opaque_identity int)
;;

(* For [set] and [unsafe_set], if a pointer is involved, we first do a physical-equality
   test to see if the pointer is changing. If not, we don't need to do the [set], which
   saves a call to [caml_modify]. We think this physical-equality test is worth it
   because it is very cheap (both values are already available from the [is_int] test)
   and because [caml_modify] is expensive. *)
let set t i obj =
  (* We use [get] first but then we use [Array.unsafe_set] since we know that [i] is
     valid. *)
  let old_obj = get t i in
  if Stdlib.Obj.is_int old_obj && Stdlib.Obj.is_int obj
  then unsafe_set_int_assuming_currently_int t i (Stdlib.Obj.obj obj : int)
  else if not (phys_equal old_obj obj)
  then unsafe_set_with_caml_modify t i obj
;;

(* [unsafe_set t i obj] follows the same three-way logic as [set] but reads the old value
   with [unsafe_get], so [i] is not validated. *)
let[@inline always] unsafe_set t i obj =
  let old_obj = unsafe_get t i in
  if Stdlib.Obj.is_int old_obj && Stdlib.Obj.is_int obj
  then unsafe_set_int_assuming_currently_int t i (Stdlib.Obj.obj obj : int)
  else if not (phys_equal old_obj obj)
  then unsafe_set_with_caml_modify t i obj
;;

(* [unsafe_set_omit_phys_equal_check t i obj] is [unsafe_set] without the
   physical-equality shortcut: when either value is not an integer the store always goes
   through [unsafe_set_with_caml_modify]. *)
let[@inline always] unsafe_set_omit_phys_equal_check t i obj =
  let old_obj = unsafe_get t i in
  if Stdlib.Obj.is_int old_obj && Stdlib.Obj.is_int obj
  then unsafe_set_int_assuming_currently_int t i (Stdlib.Obj.obj obj : int)
  else unsafe_set_with_caml_modify t i obj
;;

(* [swap t i j] exchanges slots [i] and [j]. Both reads use the checked [get], so both
   indices have been validated before the two [unsafe_set] writes happen. *)
let swap t i j =
  let a = get t i in
  let b = get t j in
  unsafe_set t i b;
  unsafe_set t j a
;;

(* [create ~len x] builds an array of [len] slots, each holding [x], without letting the
   result be tagged as a float array even when [x] is a boxed float. *)
let create ~len x =
  (* If we can, use [Array.create] directly. Even though [is_int] check is subsumed by the
     tag check, checking it is much faster, since it avoids a C function call. *)
  if Stdlib.Obj.is_int x || Stdlib.Obj.tag x <> Stdlib.Obj.double_tag
  then Array.create ~len x
  else (
    (* Otherwise use [create_zero] and set the contents *)
    let t = create_zero ~len in
    let x = Sys.opaque_identity x in
    for i = 0 to len - 1 do
      unsafe_set_with_caml_modify t i x
    done;
    t)
;;

(* [singleton obj] is the one-slot array holding [obj]. *)
let singleton obj = create ~len:1 obj

(* Pre-condition: t.(i) is an integer. *)
let unsafe_set_assuming_currently_int t i obj =
  if Stdlib.Obj.is_int obj
  then unsafe_set_int_assuming_currently_int t i (Stdlib.Obj.obj obj : int)
  else
    (* [t.(i)] is an integer and [obj] is not, so we do not need to check if they are
       equal. *)
    unsafe_set_with_caml_modify t i obj
;;

(* [unsafe_set_int t i int] stores the integer [int] in slot [i]. The direct integer
   store is used only when the slot currently holds an integer; otherwise the store goes
   through [unsafe_set_with_caml_modify]. *)
let unsafe_set_int t i int =
  let old_obj = unsafe_get t i in
  if Stdlib.Obj.is_int old_obj
  then unsafe_set_int_assuming_currently_int t i int
  else unsafe_set_with_caml_modify t i (Stdlib.Obj.repr int)
;;

(* [unsafe_clear_if_pointer t i] overwrites slot [i] with the integer 0 when the slot
   currently holds a non-integer value, and leaves integer slots untouched. *)
let unsafe_clear_if_pointer t i =
  let old_obj = unsafe_get t i in
  if not (Stdlib.Obj.is_int old_obj)
  then unsafe_set_with_caml_modify t i (Stdlib.Obj.repr 0)
;;

(** [unsafe_blit] is like [Array.blit], except it uses our own for-loop to avoid
    caml_modify when possible. Its performance is still not comparable to a memcpy. *)
let unsafe_blit ~src ~src_pos ~dst ~dst_pos ~len =
  (* When [phys_equal src dst], we need to check whether [dst_pos < src_pos] and have the
     for loop go in the right direction so that we don't overwrite data that we still
     need to read. When [not (phys_equal src dst)], doing this is harmless. From a
     memory-performance perspective, it doesn't matter whether one loops up or down.
     Constant-stride access, forward or backward, should be indistinguishable (at least
     on an intel i7). So, we skip the [phys_equal src dst] check entirely and choose the
     direction from the positions alone: loop up when [dst_pos < src_pos], loop down
     otherwise. *)
  if dst_pos < src_pos
  then
    for i = 0 to len - 1 do
      unsafe_set dst (dst_pos + i) (unsafe_get src (src_pos + i))
    done
  else
    for i = len - 1 downto 0 do
      unsafe_set dst (dst_pos + i) (unsafe_get src (src_pos + i))
    done
;;

(* Build the remaining blit operations from [unsafe_blit]. [copy] below uses [blito],
   which is not defined elsewhere in this file and so is presumably provided by this
   include -- NOTE(review): confirm against [Blit.Make]. *)
include Blit.Make (struct
    type nonrec t = t

    let create = create_zero
    let length = length
    let unsafe_blit = unsafe_blit
  end)

(* [copy src] allocates a zero-filled array of the same length as [src] and blits the
   whole of [src] into it. *)
let copy src =
  let dst = create_zero ~len:(length src) in
  blito ~src ~dst ();
  dst
;;