(** A compiled [Str] regular expression.

    NOTE(review): the name suggests this is the delimiter pattern used to
    split raw text into tokens; confirm against the implementation. *)
val regexp_split : Str.regexp

(** [_allocate_space x] maps an array of arrays to an array of arrays with
    the same element type.

    NOTE(review): the leading underscore suggests an internal helper that
    presumably allocates a structure shaped like [x]; whether the contents
    of [x] are copied is not visible from the signature. TODO confirm. *)
val _allocate_space : 'a array array -> 'a array array

(** [load_from_file ?stopwords path] returns a [string array array] built
    from the string argument [path].

    @param stopwords optional table keyed by strings; its values are never
    inspected at the type level (the value type is fully polymorphic).

    NOTE(review): presumably [path] is a file name, each inner array is the
    token list of one line or document, and keys of [stopwords] are tokens
    to drop; verify against the implementation. *)
val load_from_file :
  ?stopwords:(string, 'a) Hashtbl.t ->
  string ->
  string array array

(** [load_from_string ?stopwords s] returns a [string array] built from the
    string [s].

    @param stopwords optional table keyed by strings, with polymorphic
    values.

    NOTE(review): presumably the single-text counterpart of
    {!load_from_file}, returning the tokens of [s]; TODO confirm. *)
val load_from_string :
  ?stopwords:(string, 'a) Hashtbl.t ->
  string ->
  string array

(** [load_stopwords s] builds a table from strings to integers out of the
    string argument [s].

    NOTE(review): presumably [s] is a file name holding stopwords; the
    meaning of the [int] values is not visible here. TODO confirm. *)
val load_stopwords : string -> (string, int) Hashtbl.t

(** [build_vocabulary x] returns a pair of tables derived from [x]: the
    first from strings to integers, the second from integers to strings.

    NOTE(review): presumably a word-to-index table and its inverse;
    verify against the implementation. *)
val build_vocabulary :
  string array array ->
  (string, int) Hashtbl.t * (int, string) Hashtbl.t

(** [tokenise tbl xs] turns an array of table keys into an array of table
    values.

    NOTE(review): presumably each element is looked up in [tbl]; the
    behaviour for a key that is absent from [tbl] is not visible from the
    signature. TODO confirm. *)
val tokenise : ('a, 'b) Hashtbl.t -> 'a array -> 'b array

(** [tokenise_all tbl xss] is the array-of-arrays counterpart of
    {!tokenise}: it turns an array of arrays of table keys into an array of
    arrays of table values. *)
val tokenise_all : ('a, 'b) Hashtbl.t -> 'a array array -> 'b array array

(** [save_vocabulary v s] takes a value of any type and a string and
    returns [unit].

    NOTE(review): presumably serialises [v] to the file named [s];
    TODO confirm the on-disk format. *)
val save_vocabulary : 'a -> string -> unit

(** [load_vocabulary s] returns a value whose type is chosen by the caller.

    NOTE(review): the fully polymorphic result means the type system does
    not check that the returned value matches what was saved; callers
    should annotate the expected type. Presumably [s] is a file name
    written by {!save_vocabulary}. TODO confirm. *)
val load_vocabulary : string -> 'a

(** [save_lda_model m s] takes a value of any type and a string and returns
    [unit].

    NOTE(review): presumably serialises the model [m] to the file named
    [s]; TODO confirm. *)
val save_lda_model : 'a -> string -> unit

(** [load_lda_model s] returns a value whose type is chosen by the caller.

    NOTE(review): as with {!load_vocabulary}, the result type is unchecked;
    callers should annotate it. Presumably [s] is a file name written by
    {!save_lda_model}. TODO confirm. *)
val load_lda_model : string -> 'a

(** [simple_process x] returns a value of the same type as [x].

    NOTE(review): what processing is applied, if any, cannot be determined
    from the signature alone. *)
val simple_process : 'a -> 'a