Module Owl_nlp_utils

(** A precompiled [Str.regexp] value.

    NOTE(review): the name suggests this is the delimiter pattern used when
    splitting raw text into tokens; the pattern itself is not visible in this
    signature — confirm against the implementation. *)
val regexp_split : Str.regexp
(** [_allocate_space x] takes an array of arrays and returns an array of
    arrays with the same element type.

    NOTE(review): the leading underscore suggests an internal helper, and the
    name suggests it allocates storage shaped like [x]; neither the shape nor
    the contents of the result can be determined from the signature — confirm
    against the implementation. *)
val _allocate_space : 'a array array -> 'a array array
(** [load_from_file ?stopwords s] returns an array of string arrays built
    from the string argument [s].

    [?stopwords] is an optional hash table keyed by [string]; its value type
    is left polymorphic in this signature.

    NOTE(review): presumably [s] is a file path, each inner array holds the
    tokens of one line/document, and keys of [stopwords] are filtered out of
    the result — none of this is visible here; confirm against the
    implementation, including which exceptions are raised on I/O failure. *)
val load_from_file : ?stopwords:( string, 'a ) Stdlib.Hashtbl.t -> string -> string array array
(** [load_from_string ?stopwords s] returns an array of strings built from
    the string argument [s].

    [?stopwords] is an optional hash table keyed by [string]; its value type
    is left polymorphic in this signature.

    NOTE(review): presumably [s] is raw text that is split into tokens, with
    keys of [stopwords] removed — confirm against the implementation. *)
val load_from_string : ?stopwords:( string, 'a ) Stdlib.Hashtbl.t -> string -> string array
(** [load_stopwords s] returns a hash table mapping [string] keys to [int]
    values, built from the string argument [s].

    NOTE(review): presumably [s] is the path of a stopword list file; the
    meaning of the [int] values is not visible in this signature — confirm
    against the implementation. *)
val load_stopwords : string -> ( string, int ) Stdlib.Hashtbl.t
(** [build_vocabulary x] takes an array of string arrays and returns a pair
    of hash tables: the first maps [string] to [int], the second maps [int]
    to [string].

    NOTE(review): presumably these are the word-to-index and index-to-word
    tables for the distinct strings in [x]; how indices are assigned is not
    visible in this signature — confirm against the implementation. *)
val build_vocabulary : string array array -> ( string, int ) Stdlib.Hashtbl.t * ( int, string ) Stdlib.Hashtbl.t
(** [tokenise dict data] takes a hash table and an array and returns an
    array.

    As declared, the element types of the input and output arrays (['c] and
    ['d]) are not related to the key and value types of the table (['a] and
    ['b]), so the type checker does not tie the result to the table's
    contents.

    NOTE(review): presumably each element of [data] is looked up in [dict]
    and replaced by its bound value; the unconstrained result type looks
    over-general for that — confirm against the implementation. *)
val tokenise : ( 'a, 'b ) Stdlib.Hashtbl.t -> 'c array -> 'd array
(** [tokenise_all dict data] takes a hash table and an array of arrays and
    returns an array of arrays.

    As declared, the element types ['c] and ['d] are not related to the
    table's key and value types ['a] and ['b].

    NOTE(review): presumably this applies the same per-element lookup as
    [tokenise] to every inner array — confirm against the implementation. *)
val tokenise_all : ( 'a, 'b ) Stdlib.Hashtbl.t -> 'c array array -> 'd array array
(** [save_vocabulary v s] takes a value of any type and a string, and
    returns [unit].

    NOTE(review): presumably [s] is an output file path and [v] is written
    to it in some serialised form; the on-disk format is not visible in this
    signature — confirm against the implementation. *)
val save_vocabulary : 'a -> string -> unit
(** [load_vocabulary s] takes a string and returns a value whose type is an
    unconstrained type variable, so the result type is chosen by the call
    site and is not checked by this signature.

    NOTE(review): presumably [s] is the path of a file written by
    [save_vocabulary], and callers must annotate the result with the type
    that was saved — confirm against the implementation. *)
val load_vocabulary : string -> 'a
(** [save_lda_model m s] takes a value of any type and a string, and returns
    [unit].

    NOTE(review): presumably [s] is an output file path and [m] is an LDA
    model written to it in some serialised form; the on-disk format is not
    visible in this signature — confirm against the implementation. *)
val save_lda_model : 'a -> string -> unit
(** [load_lda_model s] takes a string and returns a value whose type is an
    unconstrained type variable, so the result type is chosen by the call
    site and is not checked by this signature.

    NOTE(review): presumably [s] is the path of a file written by
    [save_lda_model], and callers must annotate the result with the type
    that was saved — confirm against the implementation. *)
val load_lda_model : string -> 'a
(** [simple_process x] is declared with the fully polymorphic type
    ['a -> 'b]: the signature constrains neither the argument nor the
    result.

    NOTE(review): what processing is performed cannot be determined from
    this declaration; a function of this type cannot return normally without
    unsafe features, so this may be a placeholder or an over-general
    declaration — confirm against the implementation. *)
val simple_process : 'a -> 'b