sig
  (* Interface of a Unicode text module. A text is a persistent vector
     ([Pvec.t]) of Unicode scalar values ([Uchar.t]).

     Types declared in this signature are referenced by their local names
     ([t], [newline], [boundary], ...) so that the signature is
     self-contained, and [format4] and [result] are left unqualified
     instead of being reached through the deprecated [Pervasives] module.

     NOTE(review): the descriptions below are derived from the value names
     and types only, no implementation is visible from here. Anything
     marked presumably or TODO must be confirmed against the
     implementation. *)

  (** Unicode version, as a string. Presumably the version of the Unicode
      standard the module data was generated from (TODO confirm). *)
  val unicode_version : string

  (** The type for texts: a [Pvec.t] of [Uchar.t] values. *)
  type t = Uchar.t Pvec.t

  (** A constant text. Presumably the text of length zero. *)
  val empty : t

  (** [v ~len u] builds a text from a length and a character. Presumably
      [len] repetitions of [u] (TODO confirm). *)
  val v : len:int -> Uchar.t -> t

  (** [init ~len f] builds a text from a length and an index function.
      Presumably the character at index [i] is [f i] (TODO confirm). *)
  val init : len:int -> (int -> Uchar.t) -> t

  (** [of_uchar u] builds a text from the single character [u]. *)
  val of_uchar : Uchar.t -> t

  (** [str s] builds a text from the string [s]. The encoding expected for
      [s] is not visible from the signature (TODO confirm). *)
  val str : string -> t

  (** [strf fmt ...] consumes the arguments required by the format string
      [fmt], which targets [Format.formatter], and yields a text. *)
  val strf : ('a, Format.formatter, unit, t) format4 -> 'a

  (** Predicate on texts. Presumably [true] iff the text has no
      character. *)
  val is_empty : t -> bool

  (** Binary equality test on texts. *)
  val equal : t -> t -> bool

  (** Binary comparison on texts returning an [int]. The order used is not
      visible from the signature. *)
  val compare : t -> t -> int

  (* Case mappings and caseless keys. Each function maps a text to a text;
     the names suggest the Unicode case mapping and caseless matching
     algorithms (TODO confirm). *)

  val lowercased : t -> t
  val uppercased : t -> t
  val capitalized : t -> t
  val uncapitalized : t -> t
  val casefolded : t -> t
  val canonical_caseless_key : t -> t
  val compatibility_caseless_key : t -> t

  (* Identifiers. *)

  (** Predicate on texts. Which identifier syntax is tested is not visible
      from the signature (TODO confirm). *)
  val is_identifier : t -> bool

  (** Maps a text to a text. Presumably a key for caseless identifier
      comparison (TODO confirm). *)
  val identifier_caseless_key : t -> t

  (* Lines and paragraphs. *)

  (** The kind of newline recognized by {!lines}. The exact character
      sequences selected by each tag are not visible from the signature. *)
  type newline = [ `ASCII | `NLF | `Readline ]

  (** [lines ?drop_empty ?newline t] maps [t] to a vector of texts. The
      defaults of [drop_empty] and [newline] are not visible from the
      signature. *)
  val lines : ?drop_empty:bool -> ?newline:newline -> t -> t Pvec.t

  (** [paragraphs ?drop_empty t] maps [t] to a vector of texts. The default
      of [drop_empty] is not visible from the signature. *)
  val paragraphs : ?drop_empty:bool -> t -> t Pvec.t

  (* Normalization. *)

  (** The type for normalization forms. *)
  type normalization = [ `NFC | `NFD | `NFKC | `NFKD ]

  (** [normalized nf t] maps [t] to a text, given the form [nf]. *)
  val normalized : normalization -> t -> t

  (** [is_normalized nf t] is a predicate on [t], given the form [nf]. *)
  val is_normalized : normalization -> t -> bool

  (* Segmentation. *)

  (** The kind of boundary used by the segmentation functions. *)
  type boundary = [ `Grapheme_cluster | `Line_break | `Sentence | `Word ]

  (** [segments b t] maps [t] to a vector of texts, given the boundary kind
      [b]. *)
  val segments : boundary -> t -> t Pvec.t

  (** [segment_count b t] maps [t] to an [int], given the boundary kind
      [b]. Presumably the length of [segments b t] (TODO confirm). *)
  val segment_count : boundary -> t -> int

  (** The type for positions, an [int]. Whether positions denote indices
      or gaps between indices is not visible from the signature. *)
  type pos = int

  (** [boundaries b t] maps [t] to a vector of positions, given the
      boundary kind [b]. *)
  val boundaries : boundary -> t -> pos Pvec.t

  (** [boundaries_mandatory b t] is like {!boundaries} but pairs each
      position with a [bool]. Presumably the [bool] tells whether the
      boundary is mandatory (TODO confirm). *)
  val boundaries_mandatory : boundary -> t -> (pos * bool) Pvec.t

  (* Escaping. *)

  (** Maps a text to a text. The escape syntax is not visible from the
      signature. *)
  val escaped : t -> t

  (** Maps a text to [Ok] of a text or [Error] of an [int]. Presumably the
      [int] locates the first invalid escape (TODO confirm). *)
  val unescaped : t -> (t, int) result

  (* Decoding. *)

  (** [encoding_guess s] returns an encoding tag and a [bool] for the
      string [s]. The meaning of the [bool] is not visible from the
      signature (TODO confirm). *)
  val encoding_guess : string -> [ `UTF_16BE | `UTF_16LE | `UTF_8 ] * bool

  (* The following decoders take a string and an optional [first] and
     [last] pair of integers, presumably delimiting the byte range to
     decode. Their behaviour on malformed input is not visible from the
     signature (TODO confirm). *)

  val of_utf_8 : ?first:int -> ?last:int -> string -> t
  val of_utf_16le : ?first:int -> ?last:int -> string -> t
  val of_utf_16be : ?first:int -> ?last:int -> string -> t

  (** The type for results of the [try_of_*] decoders: [Ok] of a text, or
      [Error] of a text, an [int] and an [int option]. Presumably the text
      decoded so far and positions describing the error
      (TODO confirm). *)
  type decode = (t, t * int * int option) result

  (* NOTE(review): no [try_of_utf_16be] counterpart to [of_utf_16be] is
     declared here; confirm whether this is intentional. *)

  val try_of_utf_8 : ?first:int -> ?last:int -> string -> decode
  val try_of_utf_16le : ?first:int -> ?last:int -> string -> decode

  (* Encoding. The [to_*] functions map a text to a string; the
     [buffer_add_*] functions take a [Buffer.t] and a text and return
     [unit]. *)

  val to_utf_8 : t -> string
  val to_utf_16le : t -> string
  val to_utf_16be : t -> string
  val buffer_add_utf_8 : Buffer.t -> t -> unit
  val buffer_add_utf_16le : Buffer.t -> t -> unit
  val buffer_add_utf_16be : Buffer.t -> t -> unit

  (* Formatters. Each one prints a value on a [Format.formatter]; the
     output syntax of each is not visible from the signature. *)

  val pp : Format.formatter -> t -> unit
  val pp_text : Format.formatter -> t -> unit
  val pp_lines : Format.formatter -> t -> unit
  val pp_uchars : Format.formatter -> t -> unit
  val pp_toplevel : Format.formatter -> t -> unit
  val pp_toplevel_pvec : Format.formatter -> t Pvec.t -> unit
end