1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
# 1 "Camomile/public/uCS4.ml"
(** UCS4 encoded string. The type is a one-dimensional bigarray of 32-bit
integers. Bigarray.cma or Bigarray.cmxa must be linked when this module is used. *)
open Bigarray
(** A UCS4 string: a one-dimensional, C-layout bigarray of [int32] elements. *)
type t = (int32, int32_elt, c_layout) Array1.t
(** A position inside a string, represented as a plain integer. *)
type index = int
(** Raised by [validate] when an element has its top (sign) bit set. *)
exception Malformed_code
(** [validate_aux a i] scans [a] from position [i] up to the end and checks
    that every element is non-negative when read as a signed [int32], i.e.
    that its top bit is clear.
    @raise Malformed_code at the first element whose top bit is set. *)
let validate_aux (a : t) i =
  for k = i to Array1.dim a - 1 do
    (* A negative [int32] is exactly one whose bit 31 is set. *)
    if Int32.compare a.{k} Int32.zero < 0 then raise Malformed_code
  done

(** [validate a] checks every element of [a], starting at position 0.
    @raise Malformed_code if any element has its top bit set. *)
let validate (a : t) = validate_aux a 0
(** [look a i] reads the 32-bit element at position [i] of [a], widens it to
    a native [int] and converts it with [UChar.chr_of_uint]. *)
let look (a : t) i : UChar.t =
  let code = Int32.to_int a.{i} in
  UChar.chr_of_uint code
(** [length text] is the number of elements stored in [text]. *)
let length (text : t) = Array1.dim text
(** [next _ i] is the position immediately after [i]. The string argument is
    ignored and no bounds check is made. *)
let next _ i = succ i
(** [prev _ i] is the position immediately before [i]. The string argument is
    ignored and no bounds check is made. *)
let prev _ i = pred i
(** [move _ i offset] is the position [offset] elements away from [i]
    ([offset] may be negative). The string argument is ignored and the result
    is not bounds-checked. *)
let move (_ : t) i offset = i + offset
(** [first _] is the position of the first element, always [0]. *)
let first = fun _ -> 0
(** [last text] is the position of the final element of [text]; for an empty
    string this is [-1]. *)
let last (text : t) = pred (Array1.dim text)
(** [out_of_range text i] is [true] when [i] is not a valid position of
    [text], i.e. when it is negative or at least the length of [text]. *)
let out_of_range (text : t) i = not (0 <= i && i < Array1.dim text)
(** [compare_index _ i j] orders two positions: the result is negative when
    [i] comes before [j], zero when they are equal and positive when [i]
    comes after [j]. The string argument is ignored. *)
let compare_index _ i j =
  (* Explicit comparisons instead of [i - j]: the subtraction wraps around
     for operands of opposite sign and large magnitude, which would report
     the wrong ordering. *)
  if (i : int) < j then -1 else if i > j then 1 else 0
(** [nth _ n] is the position of the [n]-th element. Positions are plain
    element offsets, so this is [n] itself; the string argument is ignored. *)
let nth (_ : t) n = n
(** [get text n] is the character at position [n] of [text]; it simply
    delegates to [look]. *)
let get (text : t) n = look text n
(** [iter_aux proc a i] applies [proc] to each character of [a] in
    increasing position order, from position [i] to the end. Does nothing
    when [i] is at or past the end of [a]. *)
let iter_aux proc (a : t) i =
  for k = i to Array1.dim a - 1 do
    proc (look a k)
  done

(** [iter proc a] applies [proc] to every character of [a], first to last. *)
let iter proc (a : t) = iter_aux proc a 0
(** [init len f] builds a fresh string of [len] elements whose element at
    position [i] is the code of [f i] (via [UChar.uint_code]). [f] is called
    once per position, in increasing order. *)
let init len f =
  let result = Array1.create int32 c_layout len in
  let rec fill i =
    if i < len then begin
      result.{i} <- Int32.of_int (UChar.uint_code (f i));
      fill (i + 1)
    end
  in
  fill 0;
  result
module Buf = struct
  (** A growable buffer of UCS4 elements.
      - [init_size]: capacity requested at creation, reused by [reset];
      - [pos]: number of elements written so far (the next write position);
      - [contents]: backing storage, of which only the first [pos] cells
        hold written data. *)
  type buf = {init_size : int; mutable pos : index; mutable contents : t}

  (** [create n] makes an empty buffer with room for [n] elements. *)
  let create n =
    {init_size = n; pos = 0; contents = Array1.create int32 c_layout n}

  (** [clear b] empties [b] while keeping its current storage. *)
  let clear b = b.pos <- 0

  (** [reset b] empties [b] and replaces its storage with a fresh array of
      the initial size. *)
  let reset b =
    let fresh = Array1.create int32 c_layout b.init_size in
    b.contents <- fresh;
    b.pos <- 0

  (** [contents b] returns a fresh copy of the elements written so far. *)
  let contents b =
    let used = b.pos in
    let copy = Array1.create int32 c_layout used in
    Array1.blit (Array1.sub b.contents 0 used) copy;
    copy

  (** [resize b n] ensures the storage of [b] holds at least [n] elements.
      When it is too small, a new array of [2 * n] elements is allocated and
      the whole old storage is copied to its start. *)
  let resize b n =
    let old = b.contents in
    let capacity = Array1.dim old in
    if capacity < n then begin
      let grown = Array1.create int32 c_layout (2 * n) in
      Array1.blit old (Array1.sub grown 0 capacity);
      b.contents <- grown
    end

  (** [add_char b u] appends the code of [u] to [b], growing it if needed. *)
  let add_char b u =
    let at = b.pos in
    resize b (at + 1);
    b.contents.{at} <- Int32.of_int (UChar.uint_code u);
    b.pos <- at + 1

  (** [add_string b a] appends every element of [a] to [b]. *)
  let add_string b (a : t) =
    let count = Array1.dim a in
    let total = b.pos + count in
    resize b total;
    Array1.blit a (Array1.sub b.contents b.pos count);
    b.pos <- total

  (** [add_buffer buf1 buf2] appends the written part of [buf2] to [buf1]. *)
  let add_buffer buf1 buf2 =
    let total = buf1.pos + buf2.pos in
    resize buf1 total;
    (* Both slices are taken after the resize, so they refer to the current
       storage even when [buf1] and [buf2] are the same buffer. *)
    let src = Array1.sub buf2.contents 0 buf2.pos in
    let dst = Array1.sub buf1.contents buf1.pos buf2.pos in
    Array1.blit src dst;
    buf1.pos <- total
end
(** [compare a b] orders two strings: a shorter string sorts before a longer
    one, and strings of equal length are ordered by the standard polymorphic
    comparison applied to the two bigarrays.
    Returns a negative, zero or positive integer. *)
let compare (a : t) (b : t) =
  match Array1.dim a - Array1.dim b with
  | 0 ->
    (* This [let] is not recursive, so [compare] here is the standard
       library's polymorphic comparison, not the function being defined.
       Leaving it unqualified avoids the [Pervasives] module, which is
       deprecated since OCaml 4.08 and removed in OCaml 5.0. *)
    compare a b
  | length_diff -> length_diff