diff options
Diffstat (limited to 'lib/unilbrk/lbrktables.h')
| -rw-r--r-- | lib/unilbrk/lbrktables.h | 60 | 
1 files changed, 32 insertions, 28 deletions
| diff --git a/lib/unilbrk/lbrktables.h b/lib/unilbrk/lbrktables.h
index e86c49ff..ad72bc82 100644
--- a/lib/unilbrk/lbrktables.h
+++ b/lib/unilbrk/lbrktables.h
@@ -1,5 +1,5 @@
 /* Line breaking auxiliary tables.
-   Copyright (C) 2001-2003, 2006-2010 Free Software Foundation, Inc.
+   Copyright (C) 2001-2003, 2006-2015 Free Software Foundation, Inc.
    Written by Bruno Haible <bruno@clisp.org>, 2001.
 
    This program is free software: you can redistribute it and/or modify it
@@ -21,43 +21,47 @@
 
 enum
 {
-  /* Values >= 24 are resolved at run time. */
-  LBP_BK = 24, /* mandatory break */
+  /* Values >= 27 are resolved at run time. */
+  LBP_BK = 27, /* mandatory break */
 /*LBP_CR,         carriage return - not used here because it's a DOSism */
 /*LBP_LF,         line feed - not used here because it's a DOSism */
-  LBP_CM = 25, /* attached characters and combining marks */
+  LBP_CM = 28, /* attached characters and combining marks */
 /*LBP_NL,         next line - not used here because it's equivalent to LBP_BK */
 /*LBP_SG,         surrogates - not used here because they are not characters */
   LBP_WJ =  0, /* word joiner */
-  LBP_ZW = 26, /* zero width space */
+  LBP_ZW = 29, /* zero width space */
   LBP_GL =  1, /* non-breaking (glue) */
-  LBP_SP = 27, /* space */
+  LBP_SP = 30, /* space */
   LBP_B2 =  2, /* break opportunity before and after */
   LBP_BA =  3, /* break opportunity after */
   LBP_BB =  4, /* break opportunity before */
   LBP_HY =  5, /* hyphen */
-  LBP_CB = 28, /* contingent break opportunity */
+  LBP_CB = 31, /* contingent break opportunity */
   LBP_CL =  6, /* closing punctuation */
-  LBP_EX =  7, /* exclamation/interrogation */
-  LBP_IN =  8, /* inseparable */
-  LBP_NS =  9, /* non starter */
-  LBP_OP = 10, /* opening punctuation */
-  LBP_QU = 11, /* ambiguous quotation */
-  LBP_IS = 12, /* infix separator (numeric) */
-  LBP_NU = 13, /* numeric */
-  LBP_PO = 14, /* postfix (numeric) */
-  LBP_PR = 15, /* prefix (numeric) */
-  LBP_SY = 16, /* symbols allowing breaks */
-  LBP_AI = 29, /* ambiguous (alphabetic or ideograph) */
-  LBP_AL = 17, /* ordinary alphabetic and symbol characters */
-  LBP_H2 = 18, /* Hangul LV syllable */
-  LBP_H3 = 19, /* Hangul LVT syllable */
-  LBP_ID = 20, /* ideographic */
-  LBP_JL = 21, /* Hangul L Jamo */
-  LBP_JV = 22, /* Hangul V Jamo */
-  LBP_JT = 23, /* Hangul T Jamo */
-  LBP_SA = 30, /* complex context (South East Asian) */
-  LBP_XX = 31  /* unknown */
+  LBP_CP =  7, /* closing parenthesis */
+  LBP_EX =  8, /* exclamation/interrogation */
+  LBP_IN =  9, /* inseparable */
+  LBP_NS = 10, /* non starter */
+  LBP_OP = 11, /* opening punctuation */
+  LBP_QU = 12, /* ambiguous quotation */
+  LBP_IS = 13, /* infix separator (numeric) */
+  LBP_NU = 14, /* numeric */
+  LBP_PO = 15, /* postfix (numeric) */
+  LBP_PR = 16, /* prefix (numeric) */
+  LBP_SY = 17, /* symbols allowing breaks */
+  LBP_AI = 32, /* ambiguous (alphabetic or ideograph) */
+  LBP_AL = 18, /* ordinary alphabetic and symbol characters */
+/*LBP_CJ,         conditional Japanese starters, resolved to NS */
+  LBP_H2 = 19, /* Hangul LV syllable */
+  LBP_H3 = 20, /* Hangul LVT syllable */
+  LBP_HL = 25, /* Hebrew letter */
+  LBP_ID = 21, /* ideographic */
+  LBP_JL = 22, /* Hangul L Jamo */
+  LBP_JV = 23, /* Hangul V Jamo */
+  LBP_JT = 24, /* Hangul T Jamo */
+  LBP_RI = 26, /* regional indicator */
+  LBP_SA = 33, /* complex context (South East Asian) */
+  LBP_XX = 34  /* unknown */
 };
 
 #include "lbrkprop1.h"
@@ -88,7 +92,7 @@ unilbrkprop_lookup (ucs4_t uc)
 #define I 2  /* indirect break opportunity, '%' in table 7.3 of UTR #14 */
 #define P 3  /* prohibited break,           '^' in table 7.3 of UTR #14 */
 
-extern const unsigned char unilbrk_table[24][24];
+extern const unsigned char unilbrk_table[27][27];
 
 /* We don't support line breaking of complex-context dependent characters
    (Thai, Lao, Myanmar, Khmer) yet, because it requires dictionary lookup. */ |
