Utf8 (u.21bc00e2c735c27d55ddc3d761175d54.rdf.1.1.0.doc.rdf.Rdf.Utf8)

Sourceval utf8_nb_bytes_of_char : char -> int

Returns the number of bytes taken by a UTF-8 character, given its first byte (as a character).

Sourceval utf8_index_of_char : string -> int -> int

utf8_index_of_char str n returns the position in bytes of the nth character. n is 0-based.

raises Not_found
if there is no nth character.

Sourceval utf8_char_of_index : string -> int -> int

utf8_char_of_index str n returns the utf8 character position corresponding to the given byte index n.

Sourceval utf8_length : string -> int

utf8_length str returns the number of utf8 characters in str.

Sourceval utf8_substr : string -> int -> int -> string

utf8_substr str pos l returns the substring of str from utf8 position pos to pos+l-1.

Sourceval utf8_is_prefix : string -> string -> bool

utf8_is_prefix s1 s2 returns whether s2 is a prefix of s1.

Sourceval utf8_is_suffix : string -> string -> bool

utf8_is_suffix s1 s2 returns whether s2 is a suffix of s1.

Sourceval utf8_substr_pos : string -> string -> int option

utf8_substr_pos s1 s2 returns Some n if s2 is found at position n in s1, starting to search from the beginning of s1. Otherwise returns None.

Sourceval utf8_contains : string -> string -> bool

utf8_contains s1 s2 returns whether s1 contains s2.

Sourceval utf8_strbefore : string -> string -> string

utf8_strbefore s1 s2 returns the substring before s2 in s1. See details.

Sourceval utf8_strafter : string -> string -> string

utf8_strafter s1 s2 returns the substring after s2 in s1. See details.

Sourceval utf8_char_of_code : int32 -> string

utf8_char_of_code n returns the UTF-8 character for the given codepoint.

Sourceval utf8_get_bol : string -> (int * int) list

utf8_get_bol str returns the list of pairs (line number, char position) giving the position of the beginning of each line in the given string.

Sourceval utf8_count_nl : string -> int

utf8_count_nl str returns the number of newline \n characters found in the given UTF-8 string.

Sourceval utf8_escape : string -> string

utf8_escape str \-escapes the following characters: \n, \r, \b, \t, \f, \(quotes), \' and \\, but does not escape \u nor \U.

Sourceval utf8_unescape : string -> string

utf8_unescape str unescapes the following escaped characters: \n, \r, \b, \t, \f, \quotes, \' and \\, and also \u... and \U... sequences.

Sourceval utf8_unescape_to_percent : string -> string

utf8_unescape_to_percent str unescapes the following escaped characters: \n, \r, \b, \t, \f, \quotes, \' and \\, and also \u... and \U... sequences to percent-encoded characters, to be parsable by an IRI parser.

Sourceval utf8_lowercase : string -> string

utf8_lowercase s returns a new string, with some characters mapped to corresponding lowercase characters.

Sourceval utf8_uppercase : string -> string

utf8_uppercase s returns a new string, with some characters mapped to corresponding uppercase characters.

Sourceval utf8_backslash_quotes : string -> string

utf8_backslash_quotes s returns a new string like s with a backslash before each double quote.