Skip to content

Commit

Permalink
Update to Unicode 7.0.0
Browse files (browse the repository at this point in the history)
  • Loading branch information
behdad committed Jul 9, 2014
1 parent 7156a17 commit b102f8e
Show file tree
Hide file tree
Showing 3 changed files with 2,023 additions and 1,727 deletions.
12 changes: 9 additions & 3 deletions makeunicodedata.py
Original file line number Diff line number Diff line change
Expand Up @@ -37,7 +37,7 @@
VERSION = "3.2"

# The Unicode Database
UNIDATA_VERSION = "6.2.0"
UNIDATA_VERSION = "7.0.0"
UNICODE_DATA = "UnicodeData%s.txt"
COMPOSITION_EXCLUSIONS = "CompositionExclusions%s.txt"
EASTASIAN_WIDTH = "EastAsianWidth%s.txt"
Expand Down Expand Up @@ -69,7 +69,7 @@

BIDIRECTIONAL_NAMES = [ "L", "LRE", "LRO", "R", "AL", "RLE", "RLO",
"PDF", "EN", "ES", "ET", "AN", "CS", "NSM", "BN", "B", "S", "WS",
"ON" ]
"ON" , "LRI", "RLI", "FSI", "PDI"]

SCRIPT_NAMES = [ "Common", "Latin", "Greek", "Cyrillic", "Armenian",
"Hebrew", "Arabic", "Syriac", "Thaana", "Devanagari", "Bengali",
Expand All @@ -89,7 +89,13 @@
"Imperial_Aramaic", "Old_South_Arabian", "Inscriptional_Parthian",
"Inscriptional_Pahlavi", "Old_Turkic", "Kaithi", "Batak", "Brahmi",
"Mandaic", "Chakma", "Meroitic_Cursive", "Meroitic_Hieroglyphs", "Miao",
"Sharada", "Sora_Sompeng", "Takri", "Unknown" ]
"Sharada", "Sora_Sompeng", "Takri", "Unknown", "Bassa_Vah",
"Caucasian_Albanian", "Duployan", "Elbasan", "Grantha", "Khojki",
"Khudawadi", "Linear_A", "Mahajani", "Manichaean", "Mende_Kikakui",
"Modi", "Mro", "Nabataean", "Old_North_Arabian", "Old_Permic",
"Pahawh_Hmong", "Palmyrene", "Pau_Cin_Hau", "Psalter_Pahlavi", "Siddham",
"Tirhuta", "Warang_Citi",
]

EASTASIANWIDTH_NAMES = [ "F", "H", "W", "Na", "A", "N" ]

Expand Down
27 changes: 27 additions & 0 deletions ucdn.h
Original file line number Diff line number Diff line change
Expand Up @@ -133,6 +133,29 @@ extern "C" {
#define UCDN_SCRIPT_SORA_SOMPENG 100
#define UCDN_SCRIPT_TAKRI 101
#define UCDN_SCRIPT_UNKNOWN 102
#define UCDN_SCRIPT_BASSA_VAH 103
#define UCDN_SCRIPT_CAUCASIAN_ALBANIAN 104
#define UCDN_SCRIPT_DUPLOYAN 105
#define UCDN_SCRIPT_ELBASAN 106
#define UCDN_SCRIPT_GRANTHA 107
#define UCDN_SCRIPT_KHOJKI 108
#define UCDN_SCRIPT_KHUDAWADI 109
#define UCDN_SCRIPT_LINEAR_A 110
#define UCDN_SCRIPT_MAHAJANI 111
#define UCDN_SCRIPT_MANICHAEAN 112
#define UCDN_SCRIPT_MENDE_KIKAKUI 113
#define UCDN_SCRIPT_MODI 114
#define UCDN_SCRIPT_MRO 115
#define UCDN_SCRIPT_NABATAEAN 116
#define UCDN_SCRIPT_OLD_NORTH_ARABIAN 117
#define UCDN_SCRIPT_OLD_PERMIC 118
#define UCDN_SCRIPT_PAHAWH_HMONG 119
#define UCDN_SCRIPT_PALMYRENE 120
#define UCDN_SCRIPT_PAU_CIN_HAU 121
#define UCDN_SCRIPT_PSALTER_PAHLAVI 122
#define UCDN_SCRIPT_SIDDHAM 123
#define UCDN_SCRIPT_TIRHUTA 124
#define UCDN_SCRIPT_WARANG_CITI 125

#define UCDN_GENERAL_CATEGORY_CC 0
#define UCDN_GENERAL_CATEGORY_CF 1
Expand Down Expand Up @@ -184,6 +207,10 @@ extern "C" {
#define UCDN_BIDI_CLASS_S 16
#define UCDN_BIDI_CLASS_WS 17
#define UCDN_BIDI_CLASS_ON 18
#define UCDN_BIDI_CLASS_LRI 19
#define UCDN_BIDI_CLASS_RLI 20
#define UCDN_BIDI_CLASS_FSI 21
#define UCDN_BIDI_CLASS_PDI 22

/**
* Return version of the Unicode database.
Expand Down
Loading

0 comments on commit b102f8e

Please sign in to comment.