Up
(** Unicode data *)
module Unidata : sig

  (** Interface of the Unicode data module; [Make] (declared at the end of
      this signature) produces a module of this type. *)
  module type Type = sig

    (** [read_data ?datadir s] has an unconstrained result type ['a]: the
        signature does not tie the result to any particular type, so the
        caller is responsible for annotating the expected one.
        NOTE(review): presumably [s] names a data item that is looked up
        under [datadir] -- confirm against the implementation. *)
    val read_data : ?datadir:string -> string -> 'a

    (** Closed set of general-category tags.
        NOTE(review): the tags look like the two-letter Unicode General
        Category abbreviations -- confirm. *)
    type general_category_type =
      [ `Lu | `Ll | `Lt
      | `Mn | `Mc | `Me
      | `Nd | `Nl | `No
      | `Zs | `Zl | `Zp
      | `Cc | `Cf | `Cs | `Co | `Cn
      | `Lm | `Lo
      | `Pc | `Pd | `Ps | `Pe | `Pi | `Pf | `Po
      | `Sm | `Sc | `Sk | `So ]

    (** Maps a string to a general-category tag. Behaviour on an unknown
        string is not visible from this signature. *)
    val cat_of_name : string -> general_category_type

    (** Maps a general-category tag to an integer. *)
    val num_of_cat : general_category_type -> int

    (** Maps an integer to a general-category tag.
        NOTE(review): presumably the inverse of [num_of_cat]; behaviour on
        out-of-range integers is not visible here -- confirm. *)
    val cat_of_num : int -> general_category_type

    (** Closed set of script tags. *)
    type script_type =
      [ `Common | `Inherited
      | `Latin | `Greek | `Cyrillic | `Armenian
      | `Hebrew | `Arabic | `Syriac | `Thaana
      | `Devanagari | `Bengali | `Gurmukhi | `Gujarati
      | `Oriya | `Tamil | `Telugu | `Kannada
      | `Malayalam | `Sinhala | `Thai | `Lao
      | `Tibetan | `Myanmar | `Georgian | `Hangul
      | `Ethiopic | `Cherokee | `Canadian_Aboriginal
      | `Ogham | `Runic | `Khmer | `Mongolian
      | `Hiragana | `Katakana | `Bopomofo | `Han | `Yi
      | `Old_Italic | `Gothic | `Deseret
      | `Tagalog | `Hanunoo | `Buhid | `Tagbanwa ]

    (** Maps a string to a script tag. Behaviour on an unknown string is
        not visible from this signature. *)
    val script_of_name : string -> script_type

    (** Maps an integer to a script tag.
        NOTE(review): presumably the inverse of [num_of_script] -- confirm. *)
    val script_of_num : int -> script_type

    (** Maps a script tag to an integer. *)
    val num_of_script : script_type -> int

    (** Closed set of decomposition-kind tags. *)
    type decomposition_type =
      [ `Canon | `Font | `NoBreak
      | `Initial | `Medial | `Final | `Isolated
      | `Circle | `Super | `Sub | `Vertical
      | `Wide | `Narrow | `Small | `Square
      | `Fraction | `Compat ]

    (** Decomposition information: two constant cases, or [`Composite]
        carrying a decomposition kind together with a list of characters. *)
    type decomposition_info =
      [ `Canonform
      | `HangulSyllable
      | `Composite of decomposition_type * UChar.t list ]

    (** Represented as a plain [int].
        NOTE(review): presumably a collation element whose three weights are
        packed into one integer -- confirm. *)
    type ce_type = int

    (** Extracts an integer from a [ce_type] value.
        NOTE(review): presumably the primary weight -- confirm. *)
    val primary : ce_type -> int

    (** Extracts an integer from a [ce_type] value.
        NOTE(review): presumably the secondary weight -- confirm. *)
    val secondary : ce_type -> int

    (** Extracts an integer from a [ce_type] value.
        NOTE(review): presumably the tertiary weight -- confirm. *)
    val tertiary : ce_type -> int

    (** Builds a [ce_type] value from three integers.
        NOTE(review): argument order is presumably primary, secondary,
        tertiary -- confirm against the implementation. *)
    val compose_ce : int -> int -> int -> ce_type

    (** A distinguished [ce_type] constant. *)
    val complete_ignorable : ce_type

    (** Character-indexed table; each entry is a list of pairs made of a
        character list and a [ce_type] list. *)
    type ce_tbl = (UChar.t list * ce_type list) list UCharTbl.t

    (** Closed set of variable-handling options. *)
    type variable_option =
      [ `Blanked
      | `Non_ignorable
      | `Shifted
      | `Shift_Trimmed ]

    (** Collation settings bundled with their [ce_tbl] table. The meaning of
        the individual fields is not documented in this signature. *)
    type col_info = {
      variable_top : int;
      variable_option : variable_option;
      french_accent : bool;
      hiraganaQ : bool;
      hiraganaQ_weight : int;
      tbl : ce_tbl;
    }

    (** [get_col_info ?locale ()] returns a [col_info] record.
        NOTE(review): what happens when [locale] is omitted or unknown is not
        visible here -- confirm. *)
    val get_col_info : ?locale:string -> unit -> col_info

    (** [ce tbl u] returns a list with the same element type as the entries
        of [ce_tbl].
        NOTE(review): presumably the entry of [tbl] for [u] -- confirm. *)
    val ce : ce_tbl -> UChar.t -> (UChar.t list * ce_type list) list

    (** Per-locale data; currently a single optional [col_info] field. *)
    type localedata = {
      col_info : col_info option;
    }

  end

  (** Functor producing a [Type] implementation from a [ConfigInt.Type]
      configuration module. *)
  module Make (Config : ConfigInt.Type) : Type

end