Module Owl_nlp_utils

(** A compiled regular expression from the [Str] library.
    NOTE(review): judging by the name, this is presumably the delimiter
    pattern used to split raw text into words; the actual pattern is not
    visible in this signature -- confirm against the implementation. *)
val regexp_split : Str.regexp
(** [_allocate_space x] takes an array of arrays and returns an array of
    arrays with the same element type.
    NOTE(review): the leading underscore suggests an internal helper, and
    the name suggests the result has extra capacity compared with [x];
    neither the growth policy nor whether [x] is copied or reused can be
    determined from the type -- confirm against the implementation. *)
val _allocate_space : 'a array array -> 'a array array
(** [load_from_file ?stopwords s] returns an array of string arrays built
    from the string argument [s].

    @param stopwords optional hash table keyed by strings. The value type
    is polymorphic, so only the keys can matter to this function;
    presumably words present as keys are dropped from the output -- TODO
    confirm.

    NOTE(review): [s] is presumably a file path, and each inner array is
    presumably the tokens of one line or document; the behaviour on a
    missing or unreadable file is not visible here -- confirm against the
    implementation. *)
val load_from_file : ?stopwords:(string, 'a) Stdlib.Hashtbl.t -> string -> string array array
(** [load_from_string ?stopwords s] returns an array of strings derived
    from the string [s].

    @param stopwords optional hash table keyed by strings. The value type
    is polymorphic, so only the keys can matter to this function;
    presumably words present as keys are dropped from the output -- TODO
    confirm.

    NOTE(review): presumably [s] is split into tokens; the splitting rule
    is not visible in this signature -- confirm against the
    implementation. *)
val load_from_string : ?stopwords:(string, 'a) Stdlib.Hashtbl.t -> string -> string array
(** [load_stopwords s] returns a hash table mapping strings to integers.
    NOTE(review): [s] is presumably the path of a stopword file, and the
    table keys are presumably the stopwords; the meaning of the integer
    values and the expected file format are not visible here -- confirm
    against the implementation. *)
val load_stopwords : string -> (string, int) Stdlib.Hashtbl.t
(** [build_vocabulary x] takes an array of string arrays and returns a
    pair of hash tables: the first maps strings to integers, the second
    maps integers to strings.
    NOTE(review): presumably these are the word-to-index and
    index-to-word tables of the vocabulary found in [x], and inverses of
    each other; how indices are assigned is not visible here -- confirm
    against the implementation. *)
val build_vocabulary : string array array -> (string, int) Stdlib.Hashtbl.t * (int, string) Stdlib.Hashtbl.t
(** [tokenise dict data] takes a hash table and an array and returns an
    array.
    NOTE(review): as printed, the four type variables are unrelated: the
    element types of the input and output arrays are not tied to the key
    and value types of [dict]. A lookup-based tokeniser would be expected
    to relate them (keys to input elements, values to output elements).
    Confirm the intended type against the implementation; the behaviour
    for elements absent from [dict] is also not visible here. *)
val tokenise : ('a, 'b) Stdlib.Hashtbl.t -> 'c array -> 'd array
(** [tokenise_all dict data] takes a hash table and an array of arrays and
    returns an array of arrays.
    NOTE(review): presumably the array-of-arrays counterpart of a
    per-array tokeniser, applied to every inner array -- TODO confirm. As
    printed, the four type variables are unrelated, so the signature does
    not tie the array element types to the key and value types of
    [dict]; confirm the intended type against the implementation. *)
val tokenise_all : ('a, 'b) Stdlib.Hashtbl.t -> 'c array array -> 'd array array
(** [save_vocabulary v s] takes a value of any type and a string and
    returns unit.
    NOTE(review): presumably [v] is a vocabulary and [s] the destination
    file path; the on-disk format is not visible here. The first argument
    is fully polymorphic, so the type checker does not restrict what is
    passed -- confirm against the implementation. *)
val save_vocabulary : 'a -> string -> unit
(** [load_vocabulary s] takes a string and returns a value whose type is
    an unconstrained type variable.
    NOTE(review): [s] is presumably the path of a previously saved
    vocabulary file. Because the result type is ['a], the caller chooses
    the type by annotation or context and the type checker cannot verify
    that it matches the stored data -- confirm the expected type against
    the implementation. *)
val load_vocabulary : string -> 'a
(** [save_lda_model m s] takes a value of any type and a string and
    returns unit.
    NOTE(review): presumably [m] is an LDA model and [s] the destination
    file path; the on-disk format is not visible here. The first argument
    is fully polymorphic, so the type checker does not restrict what is
    passed -- confirm against the implementation. *)
val save_lda_model : 'a -> string -> unit
(** [load_lda_model s] takes a string and returns a value whose type is
    an unconstrained type variable.
    NOTE(review): [s] is presumably the path of a previously saved LDA
    model file. Because the result type is ['a], the caller chooses the
    type by annotation or context and the type checker cannot verify that
    it matches the stored data -- confirm the expected type against the
    implementation. *)
val load_lda_model : string -> 'a
(** [simple_process x] takes a value of any type and returns a value of
    an unrelated, unconstrained type.
    NOTE(review): the signature ['a -> 'b] carries no information about
    what is consumed or produced; a total function of this type cannot
    return normally, so this may be a stub or placeholder, or the printed
    type may be less precise than the implementation -- confirm before
    relying on it. *)
val simple_process : 'a -> 'b