Up

module Unidata

: sig

Unicode data

#
module type Type = sig
#
(** [read_data ?datadir s] takes an optional [datadir] string and a string [s]
    and yields a value of the unconstrained type ['a].
    NOTE(review): presumably [s] names a data item looked up under [datadir]
    and the result is deserialised; because ['a] is picked by the caller,
    this signature does not check the result type — confirm against the
    implementation before relying on it. *)
val read_data : ?datadir:string -> string -> 'a
#
(** Closed polymorphic variant with 30 tags.
    NOTE(review): the tag names coincide with the two-letter abbreviations of
    the Unicode General_Category property (e.g. [`Lu], [`Ll], [`Nd]);
    presumably that is what they denote — confirm. *)
type general_category_type = [
| `Lu
| `Ll
| `Lt
| `Mn
| `Mc
| `Me
| `Nd
| `Nl
| `No
| `Zs
| `Zl
| `Zp
| `Cc
| `Cf
| `Cs
| `Co
| `Cn
| `Lm
| `Lo
| `Pc
| `Pd
| `Ps
| `Pe
| `Pi
| `Pf
| `Po
| `Sm
| `Sc
| `Sk
| `So
]
#
(** Maps a string to a {!general_category_type} tag.
    NOTE(review): presumably the string is the textual category name; the
    accepted spellings and the behaviour on an unknown name are not visible
    here — confirm. *)
val cat_of_name : string -> general_category_type
#
(** Maps a {!general_category_type} tag to an integer.
    NOTE(review): presumably the inverse of [cat_of_num]; the numbering
    scheme is not visible here — confirm. *)
val num_of_cat : general_category_type -> int
#
(** Maps an integer to a {!general_category_type} tag.
    NOTE(review): presumably the inverse of [num_of_cat]; the behaviour on an
    out-of-range integer is not visible here — confirm. *)
val cat_of_num : int -> general_category_type
#
(** Closed polymorphic variant with 45 tags, each named after a writing
    system, plus [`Common] and [`Inherited].
    NOTE(review): presumably these mirror values of the Unicode Script
    property; the list is fixed, so scripts not named here cannot be
    represented — confirm which Unicode version it tracks. *)
type script_type = [
| `Common
| `Inherited
| `Latin
| `Greek
| `Cyrillic
| `Armenian
| `Hebrew
| `Arabic
| `Syriac
| `Thaana
| `Devanagari
| `Bengali
| `Gurmukhi
| `Gujarati
| `Oriya
| `Tamil
| `Telugu
| `Kannada
| `Malayalam
| `Sinhala
| `Thai
| `Lao
| `Tibetan
| `Myanmar
| `Georgian
| `Hangul
| `Ethiopic
| `Cherokee
| `Canadian_Aboriginal
| `Ogham
| `Runic
| `Khmer
| `Mongolian
| `Hiragana
| `Katakana
| `Bopomofo
| `Han
| `Yi
| `Old_Italic
| `Gothic
| `Deseret
| `Tagalog
| `Hanunoo
| `Buhid
| `Tagbanwa
]
#
(** Maps a string to a {!script_type} tag.
    NOTE(review): presumably the string is the script's textual name; the
    accepted spellings and the behaviour on an unknown name are not visible
    here — confirm. *)
val script_of_name : string -> script_type
#
(** Maps an integer to a {!script_type} tag.
    NOTE(review): presumably the inverse of [num_of_script]; the behaviour on
    an out-of-range integer is not visible here — confirm. *)
val script_of_num : int -> script_type
#
(** Maps a {!script_type} tag to an integer.
    NOTE(review): presumably the inverse of [script_of_num]; the numbering
    scheme is not visible here — confirm. *)
val num_of_script : script_type -> int
#
(** Closed polymorphic variant with 17 tags; it is the first component of the
    [`Composite] case of {!decomposition_info}.
    NOTE(review): the tag names resemble the Unicode decomposition-type
    labels (canonical, font, noBreak, ...); presumably that is what they
    denote — confirm. *)
type decomposition_type = [
| `Canon
| `Font
| `NoBreak
| `Initial
| `Medial
| `Final
| `Isolated
| `Circle
| `Super
| `Sub
| `Vertical
| `Wide
| `Narrow
| `Small
| `Square
| `Fraction
| `Compat
]
#
(** Three-case polymorphic variant: two constant tags, [`Canonform] and
    [`HangulSyllable], and [`Composite], which carries a
    {!decomposition_type} together with a list of [UChar.t].
    NOTE(review): presumably the list is the sequence the character
    decomposes into — confirm. *)
type decomposition_info = [
| `Canonform
| `HangulSyllable
| `Composite of decomposition_type * UChar.t list
]
#
(** Alias for [int]; the representation is exposed, so any [int] type-checks
    as a [ce_type].
    NOTE(review): presumably "ce" stands for collation element, with weights
    packed into the integer — confirm. *)
type ce_type = int
#
(** Extracts an integer from a {!ce_type}.
    NOTE(review): presumably the primary weight — confirm. *)
val primary : ce_type -> int
#
(** Extracts an integer from a {!ce_type}.
    NOTE(review): presumably the secondary weight — confirm. *)
val secondary : ce_type -> int
#
(** Extracts an integer from a {!ce_type}.
    NOTE(review): presumably the tertiary weight — confirm. *)
val tertiary : ce_type -> int
#
(** Builds a {!ce_type} from three integers.
    NOTE(review): presumably the arguments are the primary, secondary and
    tertiary weights in that order; the three [int]s are unlabelled, so
    confirm the order and the valid ranges against the implementation. *)
val compose_ce : int -> int -> int -> ce_type
#
(** A distinguished constant of type {!ce_type}.
    NOTE(review): presumably the element whose weights are all ignorable —
    confirm. *)
val complete_ignorable : ce_type
#
(** A [UCharTbl.t] whose entries are lists of pairs, each pairing a list of
    [UChar.t] with a list of {!ce_type}.
    NOTE(review): presumably each pair maps a following-character sequence to
    its collation elements — confirm. *)
type ce_tbl = (UChar.t list * ce_type list) list UCharTbl.t
#
(** Closed polymorphic variant with four tags; it is the type of the
    [variable_option] field of [col_info].
    NOTE(review): the tag names match the variable-weighting options of the
    Unicode Collation Algorithm; presumably that is what they select —
    confirm. *)
type variable_option = [
| `Blanked
| `Non_ignorable
| `Shifted
| `Shift_Trimmed
]
#
(** Record of six fields describing collation settings.

    Rebuilt from a listing in which every field name sat behind a stray [#]
    marker with its type on the following line; field names, order and types
    are unchanged.

    NOTE(review): the per-field remarks are inferred from the field names
    only — confirm against the implementation. *)
type col_info = {
  variable_top : int;
      (** presumably the upper bound of the variable-weight range — TODO
          confirm *)
  variable_option : variable_option;
      (** one of the four [variable_option] tags *)
  french_accent : bool;
      (** presumably toggles French-style accent ordering — TODO confirm *)
  hiraganaQ : bool;
      (** presumably toggles special handling of Hiragana — TODO confirm *)
  hiraganaQ_weight : int;
      (** presumably the weight used when [hiraganaQ] is set — TODO confirm *)
  tbl : ce_tbl;
      (** the table of type [ce_tbl] carried with these settings *)
}
#
(** [get_col_info ?locale ()] yields a [col_info] record; the trailing [unit]
    argument lets the optional [locale] be omitted.
    NOTE(review): presumably [locale] selects locale-specific collation data
    and a default is used when it is absent; the failure mode for an unknown
    locale is not visible here — confirm. *)
val get_col_info : ?locale:string -> unit -> col_info
#
(** [ce tbl u] takes a {!ce_tbl} and a [UChar.t] and yields a list of
    [(UChar.t list * ce_type list)] pairs, i.e. the element type stored in a
    {!ce_tbl}.
    NOTE(review): presumably this is the table lookup for [u] — confirm. *)
val ce : ce_tbl -> UChar.t -> (UChar.t list * ce_type list) list
#
(** Record with a single optional field.

    Rebuilt from a listing in which the field name sat behind a stray [#]
    marker with its type on the following line; the field name and type are
    unchanged.

    NOTE(review): presumably [None] means the locale supplies no collation
    settings of its own — confirm. *)
type localedata = {
  col_info : col_info option;  (** collation settings, when present *)
}
end
#
(** Functor taking a [Config] module of signature [ConfigInt.Type] and
    producing a module of signature [Type].
    NOTE(review): presumably [Config] supplies the data directories the
    resulting module reads from — confirm against [ConfigInt]. *)
module Make : functor (Config : ConfigInt.Type) -> Type
end