(** A compiled [Str] regular expression.
    NOTE(review): presumably the delimiter pattern used when splitting raw
    text into words — confirm against the implementation. *)
val regexp_split : Str.regexp

(** [_allocate_space x] takes an array of arrays and returns an array of
    arrays with the same element type.
    NOTE(review): the leading underscore suggests an internal helper;
    whether the result shares storage with [x] cannot be told from the
    signature — confirm. *)
val _allocate_space : 'a array array -> 'a array array

(** [load_from_file ?stopwords s] returns an array of string arrays.
    [stopwords], when supplied, is a hash table keyed by strings; its value
    type is unconstrained.
    NOTE(review): presumably [s] is a file name, each inner array is the
    word list of one line/document, and words found in [stopwords] are
    dropped — confirm. *)
val load_from_file :
  ?stopwords:(string, 'a) Stdlib.Hashtbl.t ->
  string ->
  string array array

(** [load_from_string ?stopwords s] returns an array of strings.
    [stopwords], when supplied, is a hash table keyed by strings; its value
    type is unconstrained.
    NOTE(review): presumably [s] is the text itself and the result is its
    word list with stop words removed — confirm. *)
val load_from_string :
  ?stopwords:(string, 'a) Stdlib.Hashtbl.t ->
  string ->
  string array

(** [load_stopwords s] returns a hash table from strings to integers.
    NOTE(review): presumably [s] is a file name and the keys are the stop
    words; the meaning of the integer values is not visible here —
    confirm. *)
val load_stopwords : string -> (string, int) Stdlib.Hashtbl.t

(** [build_vocabulary x] takes an array of string arrays and returns a pair
    of hash tables: one from strings to integers and one from integers to
    strings.
    NOTE(review): presumably a word-to-index table and its inverse —
    confirm. *)
val build_vocabulary :
  string array array ->
  (string, int) Stdlib.Hashtbl.t * (int, string) Stdlib.Hashtbl.t

(** [tokenise dict data] takes a hash table and an array and returns an
    array.
    NOTE(review): the element types ['c] and ['d] are not related to the
    table's key and value types ['a] and ['b] in this signature, so the
    compiler does not check that [data] matches [dict]; callers may need
    type annotations — confirm this is intentional. *)
val tokenise : ('a, 'b) Stdlib.Hashtbl.t -> 'c array -> 'd array

(** [tokenise_all dict data] takes a hash table and an array of arrays and
    returns an array of arrays.
    NOTE(review): presumably applies {!tokenise} to every inner array; the
    same caveat about unrelated type variables applies — confirm. *)
val tokenise_all :
  ('a, 'b) Stdlib.Hashtbl.t ->
  'c array array ->
  'd array array

(** [save_vocabulary v s] takes a value of any type and a string and returns
    unit.
    NOTE(review): presumably writes [v] to the file named [s] — confirm. *)
val save_vocabulary : 'a -> string -> unit

(** [load_vocabulary s] takes a string and returns a value whose type is
    unconstrained by the signature.
    NOTE(review): presumably reads back what {!save_vocabulary} wrote;
    because the result type is fully polymorphic, callers should annotate
    the expected type — confirm. *)
val load_vocabulary : string -> 'a

(** [save_lda_model m s] takes a value of any type and a string and returns
    unit.
    NOTE(review): presumably writes the model [m] to the file named [s] —
    confirm. *)
val save_lda_model : 'a -> string -> unit

(** [load_lda_model s] takes a string and returns a value whose type is
    unconstrained by the signature.
    NOTE(review): presumably reads back what {!save_lda_model} wrote;
    callers should annotate the expected type — confirm. *)
val load_lda_model : string -> 'a

(** [simple_process x] accepts a value of any type and returns a value of
    any type.
    NOTE(review): a fully polymorphic ['a -> 'b] usually means the function
    never returns normally (e.g. always raises); behaviour is not visible
    here — confirm. *)
val simple_process : 'a -> 'b