UTF-8 utilities

|module-utf8_utils|

Constants

UTF8_ACCEPT = 0x0

|variable-utf8_utils-UTF8_ACCEPT|

Uncategorized

utf16_to_utf32(high: uint const; low: uint const)

utf16_to_utf32 returns uint

argument

argument type

high

uint const

low

uint const

|function-utf8_utils-utf16_to_utf32|

utf8_encode(dest_array: array<uint8>; ch: uint const)

argument

argument type

dest_array

array<uint8>

ch

uint const

Converts UTF-32 string to UTF-8 and returns it as a UTF-8 byte array

utf8_encode(ch: uint const)

utf8_encode returns array<uint8>

argument

argument type

ch

uint const

Converts UTF-32 string to UTF-8 and returns it as a UTF-8 byte array

utf8_encode(dest_array: array<uint8>; source_utf32_string: array<uint> const implicit)

argument

argument type

dest_array

array<uint8>

source_utf32_string

array<uint> const implicit

Converts UTF-32 string to UTF-8 and returns it as a UTF-8 byte array

utf8_encode(source_utf32_string: array<uint> const implicit)

utf8_encode returns array<uint8>

argument

argument type

source_utf32_string

array<uint> const implicit

Converts UTF-32 string to UTF-8 and returns it as a UTF-8 byte array

utf8_length(utf8_string: array<uint8> const implicit)

utf8_length returns int

argument

argument type

utf8_string

array<uint8> const implicit

Returns the number of characters in the UTF-8 string

utf8_length(utf8_string: string const)

utf8_length returns int

argument

argument type

utf8_string

string const

Returns the number of characters in the UTF-8 string

is_first_byte_of_utf8_char(ch: uint8 const)

is_first_byte_of_utf8_char returns bool

argument

argument type

ch

uint8 const

|function-utf8_utils-is_first_byte_of_utf8_char|

contains_utf8_bom(utf8_string: array<uint8> const implicit)

contains_utf8_bom returns bool

argument

argument type

utf8_string

array<uint8> const implicit

Copyright (c) 2008-2009 Bjoern Hoehrmann <bjoern@hoehrmann.de> See http://bjoern.hoehrmann.de/utf-8/decoder/dfa/ for details.

contains_utf8_bom(utf8_string: string const)

contains_utf8_bom returns bool

argument

argument type

utf8_string

string const

Copyright (c) 2008-2009 Bjoern Hoehrmann <bjoern@hoehrmann.de> See http://bjoern.hoehrmann.de/utf-8/decoder/dfa/ for details.

is_utf8_string_valid(utf8_string: array<uint8> const implicit)

is_utf8_string_valid returns bool

argument

argument type

utf8_string

array<uint8> const implicit

|function-utf8_utils-is_utf8_string_valid|

is_utf8_string_valid(utf8_string: string const)

is_utf8_string_valid returns bool

argument

argument type

utf8_string

string const

|function-utf8_utils-is_utf8_string_valid|

utf8_decode(dest_utf32_string: array<uint>; source_utf8_string: array<uint8> const implicit)

argument

argument type

dest_utf32_string

array<uint>

source_utf8_string

array<uint8> const implicit

Converts UTF-8 string to UTF-32 and appends it to the array of codepoints (UTF-32 string)

utf8_decode(source_utf8_string: array<uint8> const implicit)

utf8_decode returns array<uint>

argument

argument type

source_utf8_string

array<uint8> const implicit

Converts UTF-8 string to UTF-32 and appends it to the array of codepoints (UTF-32 string)

utf8_decode(source_utf8_string: string const)

utf8_decode returns array<uint>

argument

argument type

source_utf8_string

string const

Converts UTF-8 string to UTF-32 and appends it to the array of codepoints (UTF-32 string)

utf8_decode(dest_utf32_string: array<uint>; source_utf8_string: string const)

argument

argument type

dest_utf32_string

array<uint>

source_utf8_string

string const

Converts UTF-8 string to UTF-32 and appends it to the array of codepoints (UTF-32 string)

decode_unicode_escape(str: string const)

decode_unicode_escape returns string

argument

argument type

str

string const

|function-utf8_utils-decode_unicode_escape|