--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/graphicsdeviceinterface/gdi/sgdi/LineBreak.cpp Tue Feb 02 01:47:50 2010 +0200
@@ -0,0 +1,1990 @@
+// Copyright (c) 2006-2009 Nokia Corporation and/or its subsidiary(-ies).
+// All rights reserved.
+// This component and the accompanying materials are made available
+// under the terms of "Eclipse Public License v1.0"
+// which accompanies this distribution, and is available
+// at the URL "http://www.eclipse.org/legal/epl-v10.html".
+//
+// Initial Contributors:
+// Nokia Corporation - initial contribution.
+//
+// Contributors:
+//
+// Description:
+// This file was last edited on 09/04/2007. Please read the 'Unicode Character Data and Line Break data Update History.doc' file
+// for the latest updates.
+//
+//
+
+#include "LineBreak.h"
+#include "LineBreakImp.h"
+#include <e32std.h>
+#include <e32svr.h>
+
+_LIT(KLinebreakPanicCategory,"LineBreak");
+
+GLDEF_C void Panic(TInt aError)
+ {
+ User::Panic(KLinebreakPanicCategory,aError);
+ }
+
+const TUint KOpFlag = 1 << MLineBreaker::EOpLineBreakClass;
+const TUint KClFlag = 1 << MLineBreaker::EClLineBreakClass;
+const TUint KNsFlag = 1 << MLineBreaker::ENsLineBreakClass;
+const TUint KExFlag = 1 << MLineBreaker::EExLineBreakClass;
+const TUint KSyFlag = 1 << MLineBreaker::ESyLineBreakClass;
+const TUint KIsFlag = 1 << MLineBreaker::EIsLineBreakClass;
+const TUint KPrFlag = 1 << MLineBreaker::EPrLineBreakClass;
+const TUint KPoFlag = 1 << MLineBreaker::EPoLineBreakClass;
+const TUint KNuFlag = 1 << MLineBreaker::ENuLineBreakClass;
+const TUint KAlFlag = 1 << MLineBreaker::EAlLineBreakClass;
+const TUint KIdFlag = 1 << MLineBreaker::EIdLineBreakClass;
+const TUint KInFlag = 1 << MLineBreaker::EInLineBreakClass;
+const TUint KBbFlag = 1 << MLineBreaker::EBbLineBreakClass;
+const TUint KB2Flag = 1 << MLineBreaker::EB2LineBreakClass;
+const TUint KZwFlag = 1 << MLineBreaker::EZwLineBreakClass;
+const TUint KCmFlag = 1 << MLineBreaker::ECmLineBreakClass;
+const TUint KAiFlag = 1 << MLineBreaker::EAiLineBreakClass;
+
+const TUint KAiAlFlags = KAiFlag | KAlFlag;
+
+const TUint KAllBreaks = 0xFFFFFFFF;
+const TUint KUsualForbidden = KClFlag | KExFlag | KSyFlag | KIsFlag | KZwFlag;
+const TUint KUsualAllowed = KOpFlag | KPrFlag | KPoFlag | KNuFlag | KAiAlFlags | KIdFlag | KInFlag | KBbFlag | KB2Flag;
+
+const TUint KAlAllowed = KOpFlag | KPrFlag | KPoFlag | KIdFlag | KBbFlag | KB2Flag;
+
+// A table of break rules, indexed by the class of the character before the possible break.
+static const TLineBreakRule TheLineBreakRuleTable[MLineBreaker::ELineBreakClasses] =
+ {
+ { KAllBreaks - KCmFlag,0 }, // Op
+ { KUsualForbidden | KNsFlag,KUsualAllowed - KPoFlag }, // Cl
+ { KUsualForbidden | KOpFlag,0 }, // Qu
+ { KUsualForbidden, 0 }, // Gl
+ { KUsualForbidden, KUsualAllowed }, // Ns
+ { KUsualForbidden, KUsualAllowed }, // Ex
+ { KUsualForbidden, KUsualAllowed - KNuFlag }, // Sy
+ { KUsualForbidden, KUsualAllowed - KNuFlag }, // Is
+ { KUsualForbidden, KPrFlag | KPoFlag | KInFlag | KBbFlag | KB2Flag }, // Pr
+ { KUsualForbidden, KUsualAllowed }, // Po
+ { KUsualForbidden, KOpFlag | KPrFlag | KIdFlag | KBbFlag | KB2Flag }, // Nu
+ { KUsualForbidden, KAlAllowed }, // Al
+ { KUsualForbidden, KUsualAllowed - KPoFlag - KInFlag }, // Id
+ { KUsualForbidden, KUsualAllowed - KInFlag }, // In
+ { KUsualForbidden, KUsualAllowed }, // Hy
+ { KUsualForbidden, KUsualAllowed }, // Ba
+ { KUsualForbidden, 0 }, // Bb
+ { KUsualForbidden | KB2Flag, KUsualAllowed }, // B2
+ { KZwFlag, KAllBreaks - KZwFlag - KCmFlag}, // Zw
+ { KUsualForbidden, KOpFlag | KPrFlag | KPoFlag | KIdFlag | KBbFlag | KB2Flag }, // Cm
+ { 0, 0, }, // Bk
+ { 0, 0, }, // Cr
+ { 0, 0, }, // Lf
+ { 0, 0, }, // Sg
+ { 0, 0, }, // Cb
+ { KAllBreaks, 0, }, // Sp
+ { 0, 0, }, // Sa
+ { KUsualForbidden, KAlAllowed, }, // Ai
+ { 0, 0, } // Xx
+ };
+
+/**
+A sorted table of ranges of characters, with their line breaking classes.
+A range includes all codes for iStart <= code < iEnd.
+All these items have fixed range, please don't split any item into more or
+combine consecutive items even if they have the same property,
+because these change will cause mismatch with customer definition.
+*/
+static const TLineBreakRange TheLineBreakRangeTable[] =
+ {
+ { 0x0000, 0x0009, MLineBreaker::ECmLineBreakClass }, //<control>
+ { 0x0009, 0x000a, MLineBreaker::EBaLineBreakClass }, //<control>
+ { 0x000a, 0x000b, MLineBreaker::ELfLineBreakClass }, //<control>
+ { 0x000b, 0x000c, MLineBreaker::ECmLineBreakClass }, //<control>
+ { 0x000c, 0x000d, MLineBreaker::EBkLineBreakClass }, //<control>
+ { 0x000d, 0x000e, MLineBreaker::ECrLineBreakClass }, //<control>
+ { 0x000e, 0x0020, MLineBreaker::ECmLineBreakClass }, //<control>
+ { 0x0020, 0x0021, MLineBreaker::ESpLineBreakClass }, //space
+ { 0x0021, 0x0022, MLineBreaker::EExLineBreakClass }, //exclamation mark
+ { 0x0022, 0x0023, MLineBreaker::EQuLineBreakClass }, //quotation mark
+ { 0x0023, 0x0024, MLineBreaker::EAlLineBreakClass }, //number sign
+ { 0x0024, 0x0025, MLineBreaker::EPrLineBreakClass }, //dollar sign
+ { 0x0025, 0x0026, MLineBreaker::EPoLineBreakClass }, //percent sign
+ { 0x0026, 0x0027, MLineBreaker::EAlLineBreakClass }, //ampersand
+ { 0x0027, 0x0028, MLineBreaker::EQuLineBreakClass }, //apostrophe
+ { 0x0028, 0x0029, MLineBreaker::EOpLineBreakClass }, //left parenthesis
+ { 0x0029, 0x002a, MLineBreaker::EClLineBreakClass }, //right parenthesis
+ { 0x002a, 0x002b, MLineBreaker::EAlLineBreakClass }, //asterisk
+ { 0x002b, 0x002c, MLineBreaker::EPrLineBreakClass }, //plus sign
+ { 0x002c, 0x002d, MLineBreaker::EIsLineBreakClass }, //comma
+ { 0x002d, 0x002e, MLineBreaker::EHyLineBreakClass }, //hyphen-minus
+ { 0x002e, 0x002f, MLineBreaker::EIsLineBreakClass }, //full stop
+ { 0x002f, 0x0030, MLineBreaker::ESyLineBreakClass }, //solidus
+ { 0x0030, 0x003a, MLineBreaker::ENuLineBreakClass }, //digit zero
+ { 0x003a, 0x003c, MLineBreaker::EIsLineBreakClass }, //colon
+ { 0x003c, 0x003f, MLineBreaker::EAlLineBreakClass }, //less-than sign
+ { 0x003f, 0x0040, MLineBreaker::EExLineBreakClass }, //question mark
+ { 0x0040, 0x005b, MLineBreaker::EAlLineBreakClass }, //commercial at
+ { 0x005b, 0x005c, MLineBreaker::EOpLineBreakClass }, //left square bracket
+ { 0x005c, 0x005d, MLineBreaker::EPrLineBreakClass }, //reverse solidus
+ { 0x005d, 0x005e, MLineBreaker::EClLineBreakClass }, //right square bracket
+ { 0x005e, 0x005f, MLineBreaker::EAlLineBreakClass }, //circumflex accent
+ { 0x005f, 0x0060, MLineBreaker::EAlLineBreakClass }, //low line (underscore)
+ { 0x0060, 0x007b, MLineBreaker::EAlLineBreakClass }, //grave accent
+ { 0x007b, 0x007c, MLineBreaker::EOpLineBreakClass }, //left curly bracket
+ { 0x007c, 0x007d, MLineBreaker::EBaLineBreakClass }, //vertical line
+ { 0x007d, 0x007e, MLineBreaker::EClLineBreakClass }, //right curly bracket
+ { 0x007e, 0x007f, MLineBreaker::EAlLineBreakClass }, //tilde
+ { 0x007f, 0x00a0, MLineBreaker::ECmLineBreakClass }, //<control>
+ { 0x00a0, 0x00a1, MLineBreaker::EGlLineBreakClass }, //no-break space
+ { 0x00a1, 0x00a2, MLineBreaker::EAiLineBreakClass }, //inverted exclamation mark
+ { 0x00a2, 0x00a3, MLineBreaker::EPoLineBreakClass }, //cent sign
+ { 0x00a3, 0x00a6, MLineBreaker::EPrLineBreakClass }, //pound sign
+ { 0x00a6, 0x00a7, MLineBreaker::EAlLineBreakClass }, //broken bar
+ { 0x00a7, 0x00a9, MLineBreaker::EAiLineBreakClass }, //section sign
+ { 0x00a9, 0x00aa, MLineBreaker::EAlLineBreakClass }, //copyright sign
+ { 0x00aa, 0x00ab, MLineBreaker::EAiLineBreakClass }, //feminine ordinal indicator
+ { 0x00ab, 0x00ac, MLineBreaker::EQuLineBreakClass }, //left-pointing double angle quotation mark
+ { 0x00ac, 0x00ad, MLineBreaker::EAlLineBreakClass }, //not sign
+ { 0x00ad, 0x00ae, MLineBreaker::EBaLineBreakClass }, //soft hyphen
+ { 0x00ae, 0x00b0, MLineBreaker::EAlLineBreakClass }, //registered sign
+ { 0x00b0, 0x00b1, MLineBreaker::EPoLineBreakClass }, //degree sign
+ { 0x00b1, 0x00b2, MLineBreaker::EPrLineBreakClass }, //plus-minus sign
+ { 0x00b2, 0x00b4, MLineBreaker::EAiLineBreakClass }, //superscript two
+ { 0x00b4, 0x00b5, MLineBreaker::EBaLineBreakClass }, //acute accent
+ { 0x00b5, 0x00b6, MLineBreaker::EAlLineBreakClass }, //micro sign
+ { 0x00b6, 0x00bb, MLineBreaker::EAiLineBreakClass }, //pilcrow sign
+ { 0x00bb, 0x00bc, MLineBreaker::EQuLineBreakClass }, //right-pointing double angle quotation mark
+ { 0x00bc, 0x00c0, MLineBreaker::EAiLineBreakClass }, //vulgar fraction one quarter
+ { 0x00c0, 0x00c6, MLineBreaker::EAlLineBreakClass }, //latin capital letter a with grave
+ { 0x00c6, 0x00c7, MLineBreaker::EAiLineBreakClass }, //latin capital letter ae
+ { 0x00c7, 0x00d0, MLineBreaker::EAlLineBreakClass }, //latin capital letter c with cedilla
+ { 0x00d0, 0x00d1, MLineBreaker::EAiLineBreakClass }, //latin capital letter eth
+ { 0x00d1, 0x00d7, MLineBreaker::EAlLineBreakClass }, //latin capital letter n with tilde
+ { 0x00d7, 0x00d9, MLineBreaker::EAiLineBreakClass }, //multiplication sign
+ { 0x00d9, 0x00de, MLineBreaker::EAlLineBreakClass }, //latin capital letter u with grave
+ { 0x00de, 0x00e2, MLineBreaker::EAiLineBreakClass }, //latin capital letter thorn
+ { 0x00e2, 0x00e6, MLineBreaker::EAlLineBreakClass }, //latin small letter a with circumflex
+ { 0x00e6, 0x00e7, MLineBreaker::EAiLineBreakClass }, //latin small letter ae
+ { 0x00e7, 0x00e8, MLineBreaker::EAlLineBreakClass }, //latin small letter c with cedilla
+ { 0x00e8, 0x00eb, MLineBreaker::EAiLineBreakClass }, //latin small letter e with grave
+ { 0x00eb, 0x00ec, MLineBreaker::EAlLineBreakClass }, //latin small letter e with diaeresis
+ { 0x00ec, 0x00ee, MLineBreaker::EAiLineBreakClass }, //latin small letter i with grave
+ { 0x00ee, 0x00f0, MLineBreaker::EAlLineBreakClass }, //latin small letter i with circumflex
+ { 0x00f0, 0x00f1, MLineBreaker::EAiLineBreakClass }, //latin small letter eth
+ { 0x00f1, 0x00f2, MLineBreaker::EAlLineBreakClass }, //latin small letter n with tilde
+ { 0x00f2, 0x00f4, MLineBreaker::EAiLineBreakClass }, //latin small letter o with grave
+ { 0x00f4, 0x00f7, MLineBreaker::EAlLineBreakClass }, //latin small letter o with circumflex
+ { 0x00f7, 0x00fb, MLineBreaker::EAiLineBreakClass }, //division sign
+ { 0x00fb, 0x00fc, MLineBreaker::EAlLineBreakClass }, //latin small letter u with circumflex
+ { 0x00fc, 0x00fd, MLineBreaker::EAiLineBreakClass }, //latin small letter u with diaeresis
+ { 0x00fd, 0x00fe, MLineBreaker::EAlLineBreakClass }, //latin small letter y with acute
+ { 0x00fe, 0x00ff, MLineBreaker::EAiLineBreakClass }, //latin small letter thorn
+ { 0x00ff, 0x0101, MLineBreaker::EAlLineBreakClass }, //latin small letter y with diaeresis
+ { 0x0101, 0x0102, MLineBreaker::EAiLineBreakClass }, //latin small letter a with macron
+ { 0x0102, 0x0111, MLineBreaker::EAlLineBreakClass }, //latin capital letter a with breve
+ { 0x0111, 0x0112, MLineBreaker::EAiLineBreakClass }, //latin small letter d with stroke
+ { 0x0112, 0x0113, MLineBreaker::EAlLineBreakClass }, //latin capital letter e with macron
+ { 0x0113, 0x0114, MLineBreaker::EAiLineBreakClass }, //latin small letter e with macron
+ { 0x0114, 0x011b, MLineBreaker::EAlLineBreakClass }, //latin capital letter e with breve
+ { 0x011b, 0x011c, MLineBreaker::EAiLineBreakClass }, //latin small letter e with caron
+ { 0x011c, 0x0126, MLineBreaker::EAlLineBreakClass }, //latin capital letter g with circumflex
+ { 0x0126, 0x0128, MLineBreaker::EAiLineBreakClass }, //latin capital letter h with stroke
+ { 0x0128, 0x012b, MLineBreaker::EAlLineBreakClass }, //latin capital letter i with tilde
+ { 0x012b, 0x012c, MLineBreaker::EAiLineBreakClass }, //latin small letter i with macron
+ { 0x012c, 0x0131, MLineBreaker::EAlLineBreakClass }, //latin capital letter i with breve
+ { 0x0131, 0x0134, MLineBreaker::EAiLineBreakClass }, //latin small letter dotless i
+ { 0x0134, 0x0138, MLineBreaker::EAlLineBreakClass }, //latin capital letter j with circumflex
+ { 0x0138, 0x0139, MLineBreaker::EAiLineBreakClass }, //latin small letter kra
+ { 0x0139, 0x013f, MLineBreaker::EAlLineBreakClass }, //latin capital letter l with acute
+ { 0x013f, 0x0143, MLineBreaker::EAiLineBreakClass }, //latin capital letter l with middle dot
+ { 0x0143, 0x0144, MLineBreaker::EAlLineBreakClass }, //latin capital letter n with acute
+ { 0x0144, 0x0145, MLineBreaker::EAiLineBreakClass }, //latin small letter n with acute
+ { 0x0145, 0x0148, MLineBreaker::EAlLineBreakClass }, //latin capital letter n with cedilla
+ { 0x0148, 0x014b, MLineBreaker::EAiLineBreakClass }, //latin small letter n with caron
+ { 0x014b, 0x014d, MLineBreaker::EAlLineBreakClass }, //latin small letter eng
+ { 0x014d, 0x014e, MLineBreaker::EAiLineBreakClass }, //latin small letter o with macron
+ { 0x014e, 0x0152, MLineBreaker::EAlLineBreakClass }, //latin capital letter o with breve
+ { 0x0152, 0x0154, MLineBreaker::EAiLineBreakClass }, //latin capital ligature oe
+ { 0x0154, 0x0166, MLineBreaker::EAlLineBreakClass }, //latin capital letter r with acute
+ { 0x0166, 0x0168, MLineBreaker::EAiLineBreakClass }, //latin capital letter t with stroke
+ { 0x0168, 0x016b, MLineBreaker::EAlLineBreakClass }, //latin capital letter u with tilde
+ { 0x016b, 0x016c, MLineBreaker::EAiLineBreakClass }, //latin small letter u with macron
+ { 0x016c, 0x01ce, MLineBreaker::EAlLineBreakClass }, //latin capital letter u with breve
+ { 0x01ce, 0x01cf, MLineBreaker::EAiLineBreakClass }, //latin small letter a with caron
+ { 0x01cf, 0x01d0, MLineBreaker::EAlLineBreakClass }, //latin capital letter i with caron
+ { 0x01d0, 0x01d1, MLineBreaker::EAiLineBreakClass }, //latin small letter i with caron
+ { 0x01d1, 0x01d2, MLineBreaker::EAlLineBreakClass }, //latin capital letter o with caron
+ { 0x01d2, 0x01d3, MLineBreaker::EAiLineBreakClass }, //latin small letter o with caron
+ { 0x01d3, 0x01d4, MLineBreaker::EAlLineBreakClass }, //latin capital letter u with caron
+ { 0x01d4, 0x01d5, MLineBreaker::EAiLineBreakClass }, //latin small letter u with caron
+ { 0x01d5, 0x01d6, MLineBreaker::EAlLineBreakClass }, //latin capital letter u with diaeresis and macron
+ { 0x01d6, 0x01d7, MLineBreaker::EAiLineBreakClass }, //latin small letter u with diaeresis and macron
+ { 0x01d7, 0x01d8, MLineBreaker::EAlLineBreakClass }, //latin capital letter u with diaeresis and acute
+ { 0x01d8, 0x01d9, MLineBreaker::EAiLineBreakClass }, //latin small letter u with diaeresis and acute
+ { 0x01d9, 0x01da, MLineBreaker::EAlLineBreakClass }, //latin capital letter u with diaeresis and caron
+ { 0x01da, 0x01db, MLineBreaker::EAiLineBreakClass }, //latin small letter u with diaeresis and caron
+ { 0x01db, 0x01dc, MLineBreaker::EAlLineBreakClass }, //latin capital letter u with diaeresis and grave
+ { 0x01dc, 0x01dd, MLineBreaker::EAiLineBreakClass }, //latin small letter u with diaeresis and grave
+ { 0x01dd, 0x0250, MLineBreaker::EAlLineBreakClass }, //latin small letter turned e
+ { 0x0250, 0x0251, MLineBreaker::EAlLineBreakClass }, //latin small letter turned a
+ { 0x0251, 0x0252, MLineBreaker::EAiLineBreakClass }, //latin small letter alpha
+ { 0x0252, 0x0261, MLineBreaker::EAlLineBreakClass }, //latin small letter turned alpha
+ { 0x0261, 0x0262, MLineBreaker::EAiLineBreakClass }, //latin small letter script g
+ { 0x0262, 0x02c7, MLineBreaker::EAlLineBreakClass }, //latin letter small capital g
+ { 0x02c7, 0x02c8, MLineBreaker::EAiLineBreakClass }, //caron
+ { 0x02c8, 0x02c9, MLineBreaker::EBbLineBreakClass }, //modifier letter vertical line
+ { 0x02c9, 0x02cc, MLineBreaker::EAiLineBreakClass }, //modifier letter macron
+ { 0x02cc, 0x02cd, MLineBreaker::EBbLineBreakClass }, //modifier letter low vertical line
+ { 0x02cd, 0x02ce, MLineBreaker::EAiLineBreakClass }, //modifier letter low macron
+ { 0x02ce, 0x02d0, MLineBreaker::EAlLineBreakClass }, //modifier letter low grave accent
+ { 0x02d0, 0x02d1, MLineBreaker::EAiLineBreakClass }, //modifier letter triangular colon
+ { 0x02d1, 0x02d8, MLineBreaker::EAlLineBreakClass }, //modifier letter half triangular colon
+ { 0x02d8, 0x02dc, MLineBreaker::EAiLineBreakClass }, //breve
+ { 0x02dc, 0x02dd, MLineBreaker::EAlLineBreakClass }, //small tilde
+ { 0x02dd, 0x02de, MLineBreaker::EAiLineBreakClass }, //double acute accent
+ { 0x02de, 0x0300, MLineBreaker::EAlLineBreakClass }, //modifier letter rhotic hook
+ { 0x0300, 0x034f, MLineBreaker::ECmLineBreakClass }, //combining grave accent
+ { 0x034f, 0x0350, MLineBreaker::EGlLineBreakClass }, //COMBINING GRAPHEME JOINER
+ { 0x0350, 0x035c, MLineBreaker::ECmLineBreakClass }, //COMBINING RIGHT ARROWHEAD ABOVE
+ { 0x035c, 0x0360, MLineBreaker::EGlLineBreakClass }, //COMBINING DOUBLE BREVE BELOW
+ { 0x0360, 0x0370, MLineBreaker::ECmLineBreakClass }, //combining double tilde
+ { 0x0374, 0x0376, MLineBreaker::EAlLineBreakClass }, //greek numeral sign
+ { 0x037a, 0x037b, MLineBreaker::EAlLineBreakClass }, //greek ypogegrammeni
+ { 0x037b, 0x037e, MLineBreaker::EAlLineBreakClass }, //GREEK SMALL REVERSED LUNATE SIGMA SYMBOL
+ { 0x037e, 0x037f, MLineBreaker::EAlLineBreakClass }, //greek question mark
+ { 0x0384, 0x038b, MLineBreaker::EAlLineBreakClass }, //greek tonos
+ { 0x038c, 0x038d, MLineBreaker::EAlLineBreakClass }, //greek capital letter omicron with tonos
+ { 0x038e, 0x0391, MLineBreaker::EAlLineBreakClass }, //greek capital letter upsilon with tonos
+ { 0x0391, 0x03a2, MLineBreaker::EAiLineBreakClass }, //greek capital letter alpha
+ { 0x03a3, 0x03aa, MLineBreaker::EAiLineBreakClass }, //greek capital letter sigma
+ { 0x03aa, 0x03b1, MLineBreaker::EAlLineBreakClass }, //greek capital letter iota with dialytika
+ { 0x03b1, 0x03c2, MLineBreaker::EAiLineBreakClass }, //greek small letter alpha
+ { 0x03c2, 0x03c3, MLineBreaker::EAlLineBreakClass }, //greek small letter final sigma
+ { 0x03c3, 0x03ca, MLineBreaker::EAiLineBreakClass }, //greek small letter sigma
+ { 0x03ca, 0x03cf, MLineBreaker::EAlLineBreakClass }, //greek small letter iota with dialytika
+ { 0x03d0, 0x0400, MLineBreaker::EAlLineBreakClass }, //greek beta symbol
+ { 0x0400, 0x0401, MLineBreaker::EAlLineBreakClass }, //cyrillic capital letter ie with grave
+ { 0x0401, 0x0402, MLineBreaker::EAiLineBreakClass }, //cyrillic capital letter io
+ { 0x0402, 0x0410, MLineBreaker::EAlLineBreakClass }, //cyrillic capital letter dje
+ { 0x0410, 0x0450, MLineBreaker::EAiLineBreakClass }, //cyrillic capital letter a
+ { 0x0450, 0x0451, MLineBreaker::EAlLineBreakClass }, //cyrillic small letter ie with grave
+ { 0x0451, 0x0452, MLineBreaker::EAiLineBreakClass }, //cyrillic small letter io
+ { 0x0452, 0x0483, MLineBreaker::EAlLineBreakClass }, //cyrillic small letter dje
+ { 0x0483, 0x0487, MLineBreaker::ECmLineBreakClass }, //combining cyrillic titlo
+ { 0x0488, 0x048a, MLineBreaker::ECmLineBreakClass }, //combining cyrillic hundred thousands sign
+ { 0x048a, 0x0514, MLineBreaker::EAlLineBreakClass }, //CYRILLIC CAPITAL LETTER SHORT I WITH TAIL
+ { 0x0531, 0x0557, MLineBreaker::EAlLineBreakClass }, //armenian capital letter ayb
+ { 0x0559, 0x0560, MLineBreaker::EAlLineBreakClass }, //armenian modifier letter left half ring
+ { 0x0561, 0x0588, MLineBreaker::EAlLineBreakClass }, //armenian small letter ayb
+ { 0x0589, 0x058a, MLineBreaker::EIsLineBreakClass }, //armenian full stop
+ { 0x058a, 0x058b, MLineBreaker::EBaLineBreakClass }, //armenian hyphen
+ { 0x0591, 0x05be, MLineBreaker::ECmLineBreakClass }, //hebrew accent etnahta
+ { 0x05be, 0x05bf, MLineBreaker::EAlLineBreakClass }, //hebrew punctuation maqaf
+ { 0x05bf, 0x05c0, MLineBreaker::ECmLineBreakClass }, //hebrew point rafe
+ { 0x05c0, 0x05c1, MLineBreaker::EAlLineBreakClass }, //hebrew punctuation paseq
+ { 0x05c1, 0x05c3, MLineBreaker::ECmLineBreakClass }, //hebrew point shin dot
+ { 0x05c3, 0x05c4, MLineBreaker::EAlLineBreakClass }, //hebrew punctuation sof pasuq
+ { 0x05c4, 0x05c5, MLineBreaker::ECmLineBreakClass }, //hebrew mark upper dot
+ { 0x05c5, 0x05c6, MLineBreaker::ECmLineBreakClass }, //HEBREW MARK LOWER DOT
+ { 0x05c6, 0x05c7, MLineBreaker::EExLineBreakClass }, //HEBREW PUNCTUATION NUN HAFUKHA
+ { 0x05c7, 0x05c8, MLineBreaker::ECmLineBreakClass }, //HEBREW POINT QAMATS QATAN
+ { 0x05d0, 0x05eb, MLineBreaker::EAlLineBreakClass }, //hebrew letter alef
+ { 0x05f0, 0x05f5, MLineBreaker::EAlLineBreakClass }, //hebrew ligature yiddish double vav
+ { 0x0600, 0x0604, MLineBreaker::EAlLineBreakClass }, //ARABIC NUMBER SIGN
+ { 0x060b, 0x060c, MLineBreaker::EPoLineBreakClass }, //AFGHANI SIGN
+ { 0x060c, 0x060d, MLineBreaker::EExLineBreakClass }, //arabic comma
+ { 0x060d, 0x060e, MLineBreaker::EIsLineBreakClass }, //ARABIC DATE SEPARATOR
+ { 0x060e, 0x0610, MLineBreaker::EAlLineBreakClass }, //ARABIC POETIC VERSE SIGN
+ { 0x0610, 0x0616, MLineBreaker::ECmLineBreakClass }, //ARABIC SIGN SALLALLAHOU ALAYHE WASSALLAM
+ { 0x061b, 0x061c, MLineBreaker::EExLineBreakClass }, //arabic semicolon
+ { 0x061e, 0x061f, MLineBreaker::EExLineBreakClass }, //ARABIC TRIPLE DOT PUNCTUATION MARK
+ { 0x061f, 0x0620, MLineBreaker::EExLineBreakClass }, //arabic question mark
+ { 0x0621, 0x063b, MLineBreaker::EAlLineBreakClass }, //arabic letter hamza
+ { 0x0640, 0x064b, MLineBreaker::EAlLineBreakClass }, //arabic tatweel
+ { 0x064b, 0x065f, MLineBreaker::ECmLineBreakClass }, //arabic fathatan
+ { 0x0660, 0x066a, MLineBreaker::ENuLineBreakClass }, //arabic-indic digit zero
+ { 0x066a, 0x066b, MLineBreaker::EExLineBreakClass }, //arabic percent sign
+ { 0x066b, 0x066d, MLineBreaker::ENuLineBreakClass }, //arabic decimal & thousands separator
+ { 0x066d, 0x066e, MLineBreaker::EAlLineBreakClass }, //arabic five pointed star
+ { 0x066e, 0x0670, MLineBreaker::EAlLineBreakClass }, //arabic five pointed star
+ { 0x0670, 0x0671, MLineBreaker::ECmLineBreakClass }, //arabic letter superscript alef
+ { 0x0671, 0x06d4, MLineBreaker::EAlLineBreakClass }, //arabic letter alef wasla
+ { 0x06d4, 0x06d5, MLineBreaker::EExLineBreakClass }, //arabic full stop
+ { 0x06d5, 0x06d6, MLineBreaker::EAlLineBreakClass }, //arabic letter ae
+ { 0x06d6, 0x06e5, MLineBreaker::ECmLineBreakClass }, //arabic small high ligature sad with lam with alef maksura
+ { 0x06e5, 0x06e7, MLineBreaker::EAlLineBreakClass }, //arabic small waw
+ { 0x06e7, 0x06e9, MLineBreaker::ECmLineBreakClass }, //arabic small high yeh
+ { 0x06e9, 0x06ea, MLineBreaker::EAlLineBreakClass }, //arabic place of sajdah
+ { 0x06ea, 0x06ee, MLineBreaker::ECmLineBreakClass }, //arabic empty centre low stop
+ { 0x06ee, 0x06f0, MLineBreaker::EAlLineBreakClass }, //ARABIC LETTER DAL WITH INVERTED V
+ { 0x06f0, 0x06fa, MLineBreaker::ENuLineBreakClass }, //extended arabic-indic digit zero
+ { 0x06fa, 0x070e, MLineBreaker::EAlLineBreakClass }, //arabic letter sheen with dot below
+ { 0x070f, 0x0710, MLineBreaker::ECmLineBreakClass }, //syriac abbreviation mark
+ { 0x0710, 0x0711, MLineBreaker::EAlLineBreakClass }, //syriac letter alaph
+ { 0x0711, 0x0712, MLineBreaker::ECmLineBreakClass }, //syriac letter superscript alaph
+ { 0x0712, 0x0730, MLineBreaker::EAlLineBreakClass }, //syriac letter beth
+ { 0x0730, 0x074b, MLineBreaker::ECmLineBreakClass }, //syriac pthaha above
+ { 0x074d, 0x076e, MLineBreaker::EAlLineBreakClass }, //SYRIAC LETTER SOGDIAN ZHAIN
+ { 0x0780, 0x07a6, MLineBreaker::EAlLineBreakClass }, //thaana letter haa
+ { 0x07a6, 0x07b1, MLineBreaker::ECmLineBreakClass }, //thaana abafili
+ { 0x07b1, 0x07b2, MLineBreaker::EAlLineBreakClass }, //THAANA LETTER NAA
+ { 0x07c0, 0x07ca, MLineBreaker::ENuLineBreakClass }, //NKO DIGIT ZERO
+ { 0x07ca, 0x07eb, MLineBreaker::EAlLineBreakClass }, //NKO LETTER A
+ { 0x07eb, 0x07f4, MLineBreaker::ECmLineBreakClass }, //NKO COMBINING SHORT HIGH TONE
+ { 0x07f4, 0x07f8, MLineBreaker::EAlLineBreakClass }, //NKO HIGH TONE APOSTROPHE
+ { 0x07f8, 0x07f9, MLineBreaker::EIsLineBreakClass }, //NKO COMMA
+ { 0x07f9, 0x07fa, MLineBreaker::EExLineBreakClass }, //NKO EXCLAMATION MARK
+ { 0x07fa, 0x07fb, MLineBreaker::EAlLineBreakClass }, //NKO LAJANYALAN
+ { 0x0901, 0x0904, MLineBreaker::ECmLineBreakClass }, //devanagari sign candrabindu
+ { 0x0904, 0x093a, MLineBreaker::EAlLineBreakClass }, //devanagari letter short a: CR1080
+ { 0x093c, 0x093d, MLineBreaker::ECmLineBreakClass }, //devanagari sign nukta
+ { 0x093d, 0x093e, MLineBreaker::EAlLineBreakClass }, //devanagari sign avagraha
+ { 0x093e, 0x094e, MLineBreaker::ECmLineBreakClass }, //devanagari vowel sign aa
+ { 0x0950, 0x0951, MLineBreaker::EAlLineBreakClass }, //devanagari om
+ { 0x0951, 0x0955, MLineBreaker::ECmLineBreakClass }, //devanagari stress sign udatta
+ { 0x0958, 0x0962, MLineBreaker::EAlLineBreakClass }, //devanagari letter qa
+ { 0x0962, 0x0964, MLineBreaker::ECmLineBreakClass }, //devanagari vowel sign vocalic l
+ { 0x0964, 0x0966, MLineBreaker::EAlLineBreakClass }, //devanagari danda
+ { 0x0966, 0x0970, MLineBreaker::ENuLineBreakClass }, //devanagari digit zero
+ { 0x0970, 0x0971, MLineBreaker::EAlLineBreakClass }, //devanagari abbreviation sign
+ { 0x097b, 0x0980, MLineBreaker::EAlLineBreakClass }, //devanagari letter gga: CR1080
+ { 0x0981, 0x0984, MLineBreaker::ECmLineBreakClass }, //bengali sign candrabindu
+ { 0x0985, 0x098d, MLineBreaker::EAlLineBreakClass }, //bengali letter a
+ { 0x098f, 0x0991, MLineBreaker::EAlLineBreakClass }, //bengali letter e
+ { 0x0993, 0x09a9, MLineBreaker::EAlLineBreakClass }, //bengali letter o
+ { 0x09aa, 0x09b1, MLineBreaker::EAlLineBreakClass }, //bengali letter pa
+ { 0x09b2, 0x09b3, MLineBreaker::EAlLineBreakClass }, //bengali letter la
+ { 0x09b6, 0x09ba, MLineBreaker::EAlLineBreakClass }, //bengali letter sha
+ { 0x09bc, 0x09bd, MLineBreaker::ECmLineBreakClass }, //bengali sign nukta
+ { 0x09bd, 0x09be, MLineBreaker::EAlLineBreakClass }, //bengali sign avagraha: CR1080
+ { 0x09be, 0x09c5, MLineBreaker::ECmLineBreakClass }, //bengali vowel sign aa
+ { 0x09c7, 0x09c9, MLineBreaker::ECmLineBreakClass }, //bengali vowel sign e
+ { 0x09cb, 0x09ce, MLineBreaker::ECmLineBreakClass }, //bengali vowel sign o
+ { 0x09ce, 0x09cf, MLineBreaker::EAlLineBreakClass }, //bengali letter khanda ta: CR1080
+ { 0x09d7, 0x09d8, MLineBreaker::ECmLineBreakClass }, //bengali au length mark
+ { 0x09dc, 0x09de, MLineBreaker::EAlLineBreakClass }, //bengali letter rra
+ { 0x09df, 0x09e2, MLineBreaker::EAlLineBreakClass }, //bengali letter yya
+ { 0x09e2, 0x09e4, MLineBreaker::ECmLineBreakClass }, //bengali vowel sign vocalic l
+ { 0x09e6, 0x09f0, MLineBreaker::ENuLineBreakClass }, //bengali digit zero
+ { 0x09f0, 0x09f2, MLineBreaker::EAlLineBreakClass }, //bengali letter ra with middle diagonal
+ { 0x09f2, 0x09f4, MLineBreaker::EPrLineBreakClass }, //bengali rupee mark
+ { 0x09f4, 0x09fb, MLineBreaker::EAlLineBreakClass }, //bengali currency numerator one
+ { 0x0a01, 0x0a04, MLineBreaker::ECmLineBreakClass }, //gurmukhi sign adak bindi: CR1080
+ { 0x0a05, 0x0a0b, MLineBreaker::EAlLineBreakClass }, //gurmukhi letter a
+ { 0x0a0f, 0x0a11, MLineBreaker::EAlLineBreakClass }, //gurmukhi letter ee
+ { 0x0a13, 0x0a29, MLineBreaker::EAlLineBreakClass }, //gurmukhi letter oo
+ { 0x0a2a, 0x0a31, MLineBreaker::EAlLineBreakClass }, //gurmukhi letter pa
+ { 0x0a32, 0x0a34, MLineBreaker::EAlLineBreakClass }, //gurmukhi letter la
+ { 0x0a35, 0x0a37, MLineBreaker::EAlLineBreakClass }, //gurmukhi letter va
+ { 0x0a38, 0x0a3a, MLineBreaker::EAlLineBreakClass }, //gurmukhi letter sa
+ { 0x0a3c, 0x0a3d, MLineBreaker::ECmLineBreakClass }, //gurmukhi sign nukta
+ { 0x0a3e, 0x0a43, MLineBreaker::ECmLineBreakClass }, //gurmukhi vowel sign aa
+ { 0x0a47, 0x0a49, MLineBreaker::ECmLineBreakClass }, //gurmukhi vowel sign ee
+ { 0x0a4b, 0x0a4e, MLineBreaker::ECmLineBreakClass }, //gurmukhi vowel sign oo
+ { 0x0a59, 0x0a5d, MLineBreaker::EAlLineBreakClass }, //gurmukhi letter khha
+ { 0x0a5e, 0x0a5f, MLineBreaker::EAlLineBreakClass }, //gurmukhi letter fa
+ { 0x0a66, 0x0a70, MLineBreaker::ENuLineBreakClass }, //gurmukhi digit zero
+ { 0x0a70, 0x0a72, MLineBreaker::ECmLineBreakClass }, //gurmukhi tippi
+ { 0x0a72, 0x0a75, MLineBreaker::EAlLineBreakClass }, //gurmukhi iri
+ { 0x0a81, 0x0a84, MLineBreaker::ECmLineBreakClass }, //gujarati sign candrabindu
+ { 0x0a85, 0x0a8d, MLineBreaker::EAlLineBreakClass }, //gujarati letter a: CR1080
+ { 0x0a8d, 0x0a8e, MLineBreaker::EAlLineBreakClass }, //gujarati vowel candra e
+ { 0x0a8f, 0x0a92, MLineBreaker::EAlLineBreakClass }, //gujarati letter e
+ { 0x0a93, 0x0aa9, MLineBreaker::EAlLineBreakClass }, //gujarati letter o
+ { 0x0aaa, 0x0ab1, MLineBreaker::EAlLineBreakClass }, //gujarati letter pa
+ { 0x0ab2, 0x0ab4, MLineBreaker::EAlLineBreakClass }, //gujarati letter la
+ { 0x0ab5, 0x0aba, MLineBreaker::EAlLineBreakClass }, //gujarati letter va
+ { 0x0abc, 0x0abd, MLineBreaker::ECmLineBreakClass }, //gujarati sign nukta
+ { 0x0abd, 0x0abe, MLineBreaker::EAlLineBreakClass }, //gujarati sign avagraha
+ { 0x0abe, 0x0ac6, MLineBreaker::ECmLineBreakClass }, //gujarati vowel sign aa
+ { 0x0ac7, 0x0aca, MLineBreaker::ECmLineBreakClass }, //gujarati vowel sign e
+ { 0x0acb, 0x0ace, MLineBreaker::ECmLineBreakClass }, //gujarati vowel sign o
+ { 0x0ad0, 0x0ad1, MLineBreaker::EAlLineBreakClass }, //gujarati om
+ { 0x0ae0, 0x0ae2, MLineBreaker::EAlLineBreakClass }, //gujarati letter vocalic rr: CR1080
+ { 0x0ae2, 0x0ae4, MLineBreaker::ECmLineBreakClass }, //gujarati vowel sign vocalic l: CR1080
+ { 0x0ae6, 0x0af0, MLineBreaker::ENuLineBreakClass }, //gujarati digit zero
+ { 0x0af1, 0x0af2, MLineBreaker::EPrLineBreakClass }, //gujarati rupee sign: CR1080
+ { 0x0b01, 0x0b04, MLineBreaker::ECmLineBreakClass }, //oriya sign candrabindu
+ { 0x0b05, 0x0b0d, MLineBreaker::EAlLineBreakClass }, //oriya letter a
+ { 0x0b0f, 0x0b11, MLineBreaker::EAlLineBreakClass }, //oriya letter e
+ { 0x0b13, 0x0b29, MLineBreaker::EAlLineBreakClass }, //oriya letter o
+ { 0x0b2a, 0x0b31, MLineBreaker::EAlLineBreakClass }, //oriya letter pa
+ { 0x0b32, 0x0b34, MLineBreaker::EAlLineBreakClass }, //oriya letter la
+ { 0x0b35, 0x0b36, MLineBreaker::EAlLineBreakClass }, //oriya letter va: CR1080
+ { 0x0b36, 0x0b3a, MLineBreaker::EAlLineBreakClass }, //oriya letter sha
+ { 0x0b3c, 0x0b3d, MLineBreaker::ECmLineBreakClass }, //oriya sign nukta
+ { 0x0b3d, 0x0b3e, MLineBreaker::EAlLineBreakClass }, //oriya sign avagraha
+ { 0x0b3e, 0x0b44, MLineBreaker::ECmLineBreakClass }, //oriya vowel sign aa
+ { 0x0b47, 0x0b49, MLineBreaker::ECmLineBreakClass }, //oriya vowel sign e
+ { 0x0b4b, 0x0b4e, MLineBreaker::ECmLineBreakClass }, //oriya vowel sign o
+ { 0x0b56, 0x0b58, MLineBreaker::ECmLineBreakClass }, //oriya ai length mark
+ { 0x0b5c, 0x0b5e, MLineBreaker::EAlLineBreakClass }, //oriya letter rra
+ { 0x0b5f, 0x0b62, MLineBreaker::EAlLineBreakClass }, //oriya letter yya
+ { 0x0b66, 0x0b70, MLineBreaker::ENuLineBreakClass }, //oriya digit zero
+ { 0x0b70, 0x0b71, MLineBreaker::EAlLineBreakClass }, //oriya isshar
+ { 0x0b71, 0x0b72, MLineBreaker::EAlLineBreakClass }, //oriya letter wa: CR1080
+ { 0x0b82, 0x0b84, MLineBreaker::ECmLineBreakClass }, //tamil sign anusvara
+ { 0x0b85, 0x0b8b, MLineBreaker::EAlLineBreakClass }, //tamil letter a
+ { 0x0b8e, 0x0b91, MLineBreaker::EAlLineBreakClass }, //tamil letter e
+ { 0x0b92, 0x0b96, MLineBreaker::EAlLineBreakClass }, //tamil letter o
+ { 0x0b99, 0x0b9b, MLineBreaker::EAlLineBreakClass }, //tamil letter nga
+ { 0x0b9c, 0x0b9d, MLineBreaker::EAlLineBreakClass }, //tamil letter ja
+ { 0x0b9e, 0x0ba0, MLineBreaker::EAlLineBreakClass }, //tamil letter nya
+ { 0x0ba3, 0x0ba5, MLineBreaker::EAlLineBreakClass }, //tamil letter nna
+ { 0x0ba8, 0x0bab, MLineBreaker::EAlLineBreakClass }, //tamil letter na
+ { 0x0bae, 0x0bba, MLineBreaker::EAlLineBreakClass }, //tamil letter ma: CR1080
+ { 0x0bbe, 0x0bc3, MLineBreaker::ECmLineBreakClass }, //tamil vowel sign aa
+ { 0x0bc6, 0x0bc9, MLineBreaker::ECmLineBreakClass }, //tamil vowel sign e
+ { 0x0bca, 0x0bce, MLineBreaker::ECmLineBreakClass }, //tamil vowel sign o
+ { 0x0bd7, 0x0bd8, MLineBreaker::ECmLineBreakClass }, //tamil au length mark
+ { 0x0be6, 0x0bf0, MLineBreaker::ENuLineBreakClass }, //tamil digit one: CR1080
+ { 0x0bf0, 0x0bf9, MLineBreaker::EAlLineBreakClass }, //tamil number ten: CR1080
+ { 0x0bf9, 0x0bfa, MLineBreaker::EPrLineBreakClass }, //tamil rupee sign: CR1080
+ { 0x0bfa, 0x0bfb, MLineBreaker::EAlLineBreakClass }, //tamil number sign: CR1080
+ { 0x0c01, 0x0c04, MLineBreaker::ECmLineBreakClass }, //telugu sign candrabindu
+ { 0x0c05, 0x0c0d, MLineBreaker::EAlLineBreakClass }, //telugu letter a
+ { 0x0c0e, 0x0c11, MLineBreaker::EAlLineBreakClass }, //telugu letter e
+ { 0x0c12, 0x0c29, MLineBreaker::EAlLineBreakClass }, //telugu letter o
+ { 0x0c2a, 0x0c34, MLineBreaker::EAlLineBreakClass }, //telugu letter pa
+ { 0x0c35, 0x0c3a, MLineBreaker::EAlLineBreakClass }, //telugu letter va
+ { 0x0c3e, 0x0c45, MLineBreaker::ECmLineBreakClass }, //telugu vowel sign aa
+ { 0x0c46, 0x0c49, MLineBreaker::ECmLineBreakClass }, //telugu vowel sign e
+ { 0x0c4a, 0x0c4e, MLineBreaker::ECmLineBreakClass }, //telugu vowel sign o
+ { 0x0c55, 0x0c57, MLineBreaker::ECmLineBreakClass }, //telugu length mark
+ { 0x0c60, 0x0c62, MLineBreaker::EAlLineBreakClass }, //telugu letter vocalic rr
+ { 0x0c66, 0x0c70, MLineBreaker::ENuLineBreakClass }, //telugu digit zero
+ { 0x0c82, 0x0c84, MLineBreaker::ECmLineBreakClass }, //kannada sign anusvara
+ { 0x0c85, 0x0c8d, MLineBreaker::EAlLineBreakClass }, //kannada letter a
+ { 0x0c8e, 0x0c91, MLineBreaker::EAlLineBreakClass }, //kannada letter e
+ { 0x0c92, 0x0ca9, MLineBreaker::EAlLineBreakClass }, //kannada letter o
+ { 0x0caa, 0x0cb4, MLineBreaker::EAlLineBreakClass }, //kannada letter pa
+ { 0x0cb5, 0x0cba, MLineBreaker::EAlLineBreakClass }, //kannada letter va
+ { 0x0cbc, 0x0cbd, MLineBreaker::ECmLineBreakClass }, //kannada sign nukta: CR1080
+ { 0x0cbd, 0x0cbe, MLineBreaker::EAlLineBreakClass }, //kannada sign avagraha: CR1080
+ { 0x0cbe, 0x0cc5, MLineBreaker::ECmLineBreakClass }, //kannada vowel sign aa
+ { 0x0cc6, 0x0cc9, MLineBreaker::ECmLineBreakClass }, //kannada vowel sign e
+ { 0x0cca, 0x0cce, MLineBreaker::ECmLineBreakClass }, //kannada vowel sign o
+ { 0x0cd5, 0x0cd7, MLineBreaker::ECmLineBreakClass }, //kannada length mark
+ { 0x0cde, 0x0cdf, MLineBreaker::EAlLineBreakClass }, //kannada letter fa
+ { 0x0ce0, 0x0ce2, MLineBreaker::EAlLineBreakClass }, //kannada letter vocalic rr
+ { 0x0ce2, 0x0ce4, MLineBreaker::ECmLineBreakClass }, //kannada vowel sign vocalic l: CR1080
+ { 0x0ce6, 0x0cf0, MLineBreaker::ENuLineBreakClass }, //kannada digit zero
+ { 0x0cf1, 0x0cf3, MLineBreaker::EAlLineBreakClass }, //kannada sign jihvamuliya: CR1080
+ { 0x0d02, 0x0d04, MLineBreaker::ECmLineBreakClass }, //malayalam sign anusvara
+ { 0x0d05, 0x0d0d, MLineBreaker::EAlLineBreakClass }, //malayalam letter a
+ { 0x0d0e, 0x0d11, MLineBreaker::EAlLineBreakClass }, //malayalam letter e
+ { 0x0d12, 0x0d29, MLineBreaker::EAlLineBreakClass }, //malayalam letter o
+ { 0x0d2a, 0x0d3a, MLineBreaker::EAlLineBreakClass }, //malayalam letter pa
+ { 0x0d3e, 0x0d44, MLineBreaker::ECmLineBreakClass }, //malayalam vowel sign aa
+ { 0x0d46, 0x0d49, MLineBreaker::ECmLineBreakClass }, //malayalam vowel sign e
+ { 0x0d4a, 0x0d4e, MLineBreaker::ECmLineBreakClass }, //malayalam vowel sign o
+ { 0x0d57, 0x0d58, MLineBreaker::ECmLineBreakClass }, //malayalam au length mark
+ { 0x0d60, 0x0d62, MLineBreaker::EAlLineBreakClass }, //malayalam letter vocalic rr
+ { 0x0d66, 0x0d70, MLineBreaker::ENuLineBreakClass }, //malayalam digit zero
+ { 0x0d82, 0x0d84, MLineBreaker::ECmLineBreakClass }, //sinhala sign anusvaraya
+ { 0x0d85, 0x0d97, MLineBreaker::EAlLineBreakClass }, //sinhala letter ayanna
+ { 0x0d9a, 0x0db2, MLineBreaker::EAlLineBreakClass }, //sinhala letter alpapraana kayanna
+ { 0x0db3, 0x0dbc, MLineBreaker::EAlLineBreakClass }, //sinhala letter sanyaka dayanna
+ { 0x0dbd, 0x0dbe, MLineBreaker::EAlLineBreakClass }, //sinhala letter dantaja layanna
+ { 0x0dc0, 0x0dc7, MLineBreaker::EAlLineBreakClass }, //sinhala letter vayanna
+ { 0x0dca, 0x0dcb, MLineBreaker::ECmLineBreakClass }, //sinhala sign al-lakuna
+ { 0x0dcf, 0x0dd5, MLineBreaker::ECmLineBreakClass }, //sinhala vowel sign aela-pilla
+ { 0x0dd6, 0x0dd7, MLineBreaker::ECmLineBreakClass }, //sinhala vowel sign diga paa-pilla
+ { 0x0dd8, 0x0de0, MLineBreaker::ECmLineBreakClass }, //sinhala vowel sign gaetta-pilla
+ { 0x0df2, 0x0df4, MLineBreaker::ECmLineBreakClass }, //sinhala vowel sign diga gaetta-pilla
+ { 0x0df4, 0x0df5, MLineBreaker::EAlLineBreakClass }, //sinhala punctuation kunddaliya
+ { 0x0e01, 0x0e31, MLineBreaker::ESaLineBreakClass }, //thai character ko kai
+ { 0x0e31, 0x0e32, MLineBreaker::ECmLineBreakClass }, //thai character mai han-akat
+ { 0x0e32, 0x0e34, MLineBreaker::ESaLineBreakClass }, //thai character sara aa
+ { 0x0e34, 0x0e3b, MLineBreaker::ECmLineBreakClass }, //thai character sara i
+ { 0x0e3f, 0x0e40, MLineBreaker::EPrLineBreakClass }, //thai currency symbol baht
+ { 0x0e40, 0x0e47, MLineBreaker::ESaLineBreakClass }, //thai character sara e
+ { 0x0e47, 0x0e4f, MLineBreaker::ECmLineBreakClass }, //thai character maitaikhu
+ { 0x0e4f, 0x0e50, MLineBreaker::EAlLineBreakClass }, //thai character fongman
+ { 0x0e50, 0x0e5a, MLineBreaker::ENuLineBreakClass }, //thai digit zero
+ { 0x0e5a, 0x0e5c, MLineBreaker::ENsLineBreakClass }, //thai character angkhankhu
+ { 0x0e81, 0x0e83, MLineBreaker::ESaLineBreakClass }, //lao letter ko
+ { 0x0e84, 0x0e85, MLineBreaker::ESaLineBreakClass }, //lao letter kho tam
+ { 0x0e87, 0x0e89, MLineBreaker::ESaLineBreakClass }, //lao letter ngo
+ { 0x0e8a, 0x0e8b, MLineBreaker::ESaLineBreakClass }, //lao letter so tam
+ { 0x0e8d, 0x0e8e, MLineBreaker::ESaLineBreakClass }, //lao letter nyo
+ { 0x0e94, 0x0e98, MLineBreaker::ESaLineBreakClass }, //lao letter do
+ { 0x0e99, 0x0ea0, MLineBreaker::ESaLineBreakClass }, //lao letter no
+ { 0x0ea1, 0x0ea4, MLineBreaker::ESaLineBreakClass }, //lao letter mo
+ { 0x0ea5, 0x0ea6, MLineBreaker::ESaLineBreakClass }, //lao letter lo loot
+ { 0x0ea7, 0x0ea8, MLineBreaker::ESaLineBreakClass }, //lao letter wo
+ { 0x0eaa, 0x0eac, MLineBreaker::ESaLineBreakClass }, //lao letter so sung
+ { 0x0ead, 0x0eb1, MLineBreaker::ESaLineBreakClass }, //lao letter o
+ { 0x0eb1, 0x0eb2, MLineBreaker::ECmLineBreakClass }, //lao vowel sign mai kan
+ { 0x0eb2, 0x0eb4, MLineBreaker::ESaLineBreakClass }, //lao vowel sign aa
+ { 0x0eb4, 0x0eba, MLineBreaker::ECmLineBreakClass }, //lao vowel sign i
+ { 0x0ebb, 0x0ebd, MLineBreaker::ECmLineBreakClass }, //lao vowel sign mai kon
+ { 0x0ebd, 0x0ebe, MLineBreaker::ESaLineBreakClass }, //lao semivowel sign nyo
+ { 0x0ec0, 0x0ec5, MLineBreaker::ESaLineBreakClass }, //lao vowel sign e
+ { 0x0ec6, 0x0ec7, MLineBreaker::ESaLineBreakClass }, //lao ko la
+ { 0x0ec8, 0x0ece, MLineBreaker::ECmLineBreakClass }, //lao tone mai ek
+ { 0x0ed0, 0x0eda, MLineBreaker::ENuLineBreakClass }, //lao digit zero
+ { 0x0edc, 0x0ede, MLineBreaker::ESaLineBreakClass }, //lao ho no
+ { 0x0f00, 0x0f0b, MLineBreaker::EAlLineBreakClass }, //tibetan syllable om
+ { 0x0f0b, 0x0f0c, MLineBreaker::EBaLineBreakClass }, //tibetan mark intersyllabic tsheg
+ { 0x0f0c, 0x0f0d, MLineBreaker::EGlLineBreakClass }, //tibetan mark delimiter tsheg bstar
+ { 0x0f0d, 0x0f18, MLineBreaker::EAlLineBreakClass }, //tibetan mark shad
+ { 0x0f18, 0x0f1a, MLineBreaker::ECmLineBreakClass }, //tibetan astrological sign -khyud pa
+ { 0x0f1a, 0x0f20, MLineBreaker::EAlLineBreakClass }, //tibetan sign rdel dkar gcig
+ { 0x0f20, 0x0f2a, MLineBreaker::ENuLineBreakClass }, //tibetan digit zero
+ { 0x0f2a, 0x0f35, MLineBreaker::EAlLineBreakClass }, //tibetan digit half one
+ { 0x0f35, 0x0f36, MLineBreaker::ECmLineBreakClass }, //tibetan mark ngas bzung nyi zla
+ { 0x0f36, 0x0f37, MLineBreaker::EAlLineBreakClass }, //tibetan mark caret -dzud rtags bzhi mig can
+ { 0x0f37, 0x0f38, MLineBreaker::ECmLineBreakClass }, //tibetan mark ngas bzung sgor rtags
+ { 0x0f38, 0x0f39, MLineBreaker::EAlLineBreakClass }, //tibetan mark che mgo
+ { 0x0f39, 0x0f3a, MLineBreaker::ECmLineBreakClass }, //tibetan mark tsa -phru
+ { 0x0f3a, 0x0f3b, MLineBreaker::EOpLineBreakClass }, //tibetan mark gug rtags gyon
+ { 0x0f3b, 0x0f3c, MLineBreaker::EClLineBreakClass }, //tibetan mark gug rtags gyas
+ { 0x0f3c, 0x0f3d, MLineBreaker::EOpLineBreakClass }, //tibetan mark ang khang gyon
+ { 0x0f3d, 0x0f3e, MLineBreaker::EClLineBreakClass }, //tibetan mark ang khang gyas
+ { 0x0f3e, 0x0f40, MLineBreaker::ECmLineBreakClass }, //tibetan sign yar tshes
+ { 0x0f40, 0x0f48, MLineBreaker::EAlLineBreakClass }, //tibetan letter ka
+ { 0x0f49, 0x0f6b, MLineBreaker::EAlLineBreakClass }, //tibetan letter nya
+ { 0x0f71, 0x0f85, MLineBreaker::ECmLineBreakClass }, //tibetan vowel sign aa
+ { 0x0f85, 0x0f86, MLineBreaker::EAlLineBreakClass }, //tibetan mark paluta
+ { 0x0f86, 0x0f88, MLineBreaker::ECmLineBreakClass }, //tibetan sign lci rtags
+ { 0x0f88, 0x0f8c, MLineBreaker::EAlLineBreakClass }, //tibetan sign lce tsa can
+ { 0x0f90, 0x0f98, MLineBreaker::ECmLineBreakClass }, //tibetan subjoined letter ka
+ { 0x0f99, 0x0fbd, MLineBreaker::ECmLineBreakClass }, //tibetan subjoined letter nya
+ { 0x0fbe, 0x0fc6, MLineBreaker::EAlLineBreakClass }, //tibetan ku ru kha
+ { 0x0fc6, 0x0fc7, MLineBreaker::ECmLineBreakClass }, //tibetan symbol padma gdan
+ { 0x0fc7, 0x0fcd, MLineBreaker::EAlLineBreakClass }, //tibetan symbol rdo rje rgya gram
+ { 0x0fcf, 0x0fd0, MLineBreaker::EAlLineBreakClass }, //tibetan sign rdel nag gsum
+ { 0x0fd0, 0x0fd2, MLineBreaker::EBbLineBreakClass }, //TIBETAN MARK BSKA- SHOG GI MGO RGYAN
+ { 0x1000, 0x1022, MLineBreaker::ESaLineBreakClass }, //myanmar letter ka
+ { 0x1023, 0x1028, MLineBreaker::ESaLineBreakClass }, //myanmar letter i
+ { 0x1029, 0x102b, MLineBreaker::ESaLineBreakClass }, //myanmar letter o
+ { 0x102c, 0x1033, MLineBreaker::ECmLineBreakClass }, //myanmar vowel sign aa
+ { 0x1036, 0x103a, MLineBreaker::ECmLineBreakClass }, //myanmar sign anusvara
+ { 0x1040, 0x104a, MLineBreaker::ENuLineBreakClass }, //myanmar digit zero
+ { 0x104a, 0x1050, MLineBreaker::EAlLineBreakClass }, //myanmar sign little section
+ { 0x1050, 0x1056, MLineBreaker::ESaLineBreakClass }, //myanmar letter sha
+ { 0x1056, 0x105a, MLineBreaker::ECmLineBreakClass }, //myanmar vowel sign vocalic r
+ { 0x10a0, 0x10c6, MLineBreaker::EAlLineBreakClass }, //georgian capital letter an
+ { 0x10d0, 0x10fb, MLineBreaker::EAlLineBreakClass }, //georgian letter an
+ { 0x10fb, 0x10fc, MLineBreaker::EAlLineBreakClass }, //georgian paragraph separator
+ { 0x10fc, 0x10fd, MLineBreaker::EAlLineBreakClass }, //MODIFIER LETTER GEORGIAN NAR
+ { 0x1100, 0x115a, MLineBreaker::EIdLineBreakClass }, //hangul choseong kiyeok
+ { 0x115f, 0x1160, MLineBreaker::EIdLineBreakClass }, //hangul choseong filler
+ { 0x1160, 0x11a3, MLineBreaker::ECmLineBreakClass }, //hangul jungseong filler
+ { 0x11a8, 0x11fa, MLineBreaker::ECmLineBreakClass }, //hangul jongseong kiyeok
+ { 0x1200, 0x1248, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable ha
+ { 0x1248, 0x1249, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable qwa
+ { 0x124a, 0x124e, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable qwi
+ { 0x1250, 0x1257, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable qha
+ { 0x1258, 0x1259, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable qhwa
+ { 0x125a, 0x125e, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable qhwi
+ { 0x1260, 0x1288, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable ba
+ { 0x1288, 0x1289, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable xwa
+ { 0x128a, 0x128e, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable xwi
+ { 0x1290, 0x12b0, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable na
+ { 0x12b0, 0x12b1, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable kwa
+ { 0x12b2, 0x12b6, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable kwi
+ { 0x12b8, 0x12bf, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable kxa
+ { 0x12c0, 0x12c1, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable kxwa
+ { 0x12c2, 0x12c6, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable kxwi
+ { 0x12c8, 0x12d7, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable wa
+ { 0x12d8, 0x1310, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable za
+ { 0x1310, 0x1311, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable gwa
+ { 0x1312, 0x1316, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable gwi
+ { 0x1318, 0x135b, MLineBreaker::EAlLineBreakClass }, //ethiopic syllable gga
+ { 0x135f, 0x1360, MLineBreaker::ECmLineBreakClass }, //ETHIOPIC COMBINING GEMINATION MARK
+ { 0x1360, 0x1361, MLineBreaker::EAlLineBreakClass }, //ETHIOPIC SECTION MARK
+ { 0x1361, 0x1362, MLineBreaker::EBaLineBreakClass }, //ethiopic wordspace
+ { 0x1362, 0x1369, MLineBreaker::EAlLineBreakClass }, //ethiopic full stop
+ { 0x1369, 0x1372, MLineBreaker::ENuLineBreakClass }, //ethiopic digit one
+ { 0x1372, 0x137d, MLineBreaker::EAlLineBreakClass }, //ethiopic number ten
+ { 0x1380, 0x139a, MLineBreaker::EAlLineBreakClass }, //ETHIOPIC SYLLABLE SEBATBEIT MWA
+ { 0x13a0, 0x13f5, MLineBreaker::EAlLineBreakClass }, //cherokee letter a
+ { 0x1401, 0x1677, MLineBreaker::EAlLineBreakClass }, //canadian syllabics e
+ { 0x1680, 0x1681, MLineBreaker::EBaLineBreakClass }, //ogham space mark
+ { 0x1681, 0x169b, MLineBreaker::EAlLineBreakClass }, //ogham letter beith
+ { 0x169b, 0x169c, MLineBreaker::EOpLineBreakClass }, //ogham feather mark
+ { 0x169c, 0x169d, MLineBreaker::EClLineBreakClass }, //ogham reversed feather mark
+ { 0x16a0, 0x16f1, MLineBreaker::EAlLineBreakClass }, //runic letter fehu feoh fe f
+ { 0x1700, 0x170d, MLineBreaker::EAlLineBreakClass }, //TAGALOG LETTER A
+ { 0x170e, 0x1712, MLineBreaker::EAlLineBreakClass }, //TAGALOG LETTER LA
+ { 0x1712, 0x1715, MLineBreaker::ECmLineBreakClass }, //TAGALOG VOWEL SIGN I
+ { 0x1720, 0x1732, MLineBreaker::EAlLineBreakClass }, //HANUNOO LETTER A
+ { 0x1732, 0x1735, MLineBreaker::ECmLineBreakClass }, //HANUNOO VOWEL SIGN I
+ { 0x1735, 0x1737, MLineBreaker::EBaLineBreakClass }, //PHILIPPINE SINGLE PUNCTUATION
+ { 0x1740, 0x1752, MLineBreaker::EAlLineBreakClass }, //BUHID LETTER A
+ { 0x1752, 0x1754, MLineBreaker::ECmLineBreakClass }, //BUHID VOWEL SIGN I
+ { 0x1760, 0x176d, MLineBreaker::EAlLineBreakClass }, //TAGBANWA LETTER A
+ { 0x176e, 0x1771, MLineBreaker::EAlLineBreakClass }, //TAGBANWA LETTER LA
+ { 0x1772, 0x1774, MLineBreaker::ECmLineBreakClass }, //TAGBANWA VOWEL SIGN I
+ { 0x1780, 0x17b4, MLineBreaker::ESaLineBreakClass }, //khmer letter ka
+ { 0x17b4, 0x17d4, MLineBreaker::ECmLineBreakClass }, //khmer vowel inherent aq
+ { 0x17d4, 0x17d5, MLineBreaker::ENsLineBreakClass }, //khmer sign khan
+ { 0x17d5, 0x17d6, MLineBreaker::EBaLineBreakClass }, //khmer sign bariyoosan
+ { 0x17d6, 0x17db, MLineBreaker::ENsLineBreakClass }, //khmer sign camnuc pii kuuh
+ { 0x17db, 0x17dc, MLineBreaker::EPrLineBreakClass }, //khmer currency symbol riel
+ { 0x17dc, 0x17dd, MLineBreaker::EAlLineBreakClass }, //khmer sign avakrahasanya
+ { 0x17dd, 0x17de, MLineBreaker::ESaLineBreakClass }, //KHMER SIGN ATTHACAN
+ { 0x17e0, 0x17ea, MLineBreaker::ENuLineBreakClass }, //khmer digit zero
+ { 0x17f0, 0x17fa, MLineBreaker::EAlLineBreakClass }, //KHMER SYMBOL LEK ATTAK SON
+ { 0x1800, 0x1806, MLineBreaker::EAlLineBreakClass }, //mongolian birga
+ { 0x1806, 0x1807, MLineBreaker::EBbLineBreakClass }, //mongolian todo soft hyphen
+ { 0x1807, 0x180b, MLineBreaker::EAlLineBreakClass }, //mongolian sibe syllable boundary marker
+ { 0x180b, 0x180f, MLineBreaker::ECmLineBreakClass }, //mongolian free variation selector one
+ { 0x1810, 0x181a, MLineBreaker::ENuLineBreakClass }, //mongolian digit zero
+ { 0x1820, 0x1878, MLineBreaker::EAlLineBreakClass }, //mongolian letter a
+ { 0x1880, 0x18a9, MLineBreaker::EAlLineBreakClass }, //mongolian letter ali gali anusvara one
+ { 0x18a9, 0x18aa, MLineBreaker::ECmLineBreakClass }, //mongolian letter ali gali dagalga
+ { 0x1900, 0x191d, MLineBreaker::EAlLineBreakClass }, //LIMBU VOWEL-CARRIER LETTER
+ { 0x1920, 0x192c, MLineBreaker::ECmLineBreakClass }, //LIMBU VOWEL SIGN A
+ { 0x1930, 0x193c, MLineBreaker::ECmLineBreakClass }, //LIMBU SMALL LETTER KA
+ { 0x1940, 0x1941, MLineBreaker::EAlLineBreakClass }, //LIMBU SIGN LOO
+ { 0x1944, 0x1946, MLineBreaker::EExLineBreakClass }, //LIMBU EXCLAMATION MARK
+ { 0x1946, 0x1950, MLineBreaker::ENuLineBreakClass }, //LIMBU DIGIT ZERO
+ { 0x1950, 0x196e, MLineBreaker::ESaLineBreakClass }, //TAI LE LETTER KA
+ { 0x1970, 0x1975, MLineBreaker::ESaLineBreakClass }, //TAI LE LETTER TONE-2
+ { 0x1980, 0x19aa, MLineBreaker::ESaLineBreakClass }, //NEW TAI LUE LETTER HIGH QA
+ { 0x19b0, 0x19ca, MLineBreaker::ESaLineBreakClass }, //NEW TAI LUE VOWEL SIGN VOWEL SHORTENER
+ { 0x19d0, 0x19da, MLineBreaker::ENuLineBreakClass }, //NEW TAI LUE DIGIT ZERO
+ { 0x19de, 0x19e0, MLineBreaker::ESaLineBreakClass }, //NEW TAI LUE SIGN LAE
+ { 0x19e0, 0x1a17, MLineBreaker::EAlLineBreakClass }, //KHMER SYMBOL PATHAMASAT
+ { 0x1a17, 0x1a1c, MLineBreaker::ECmLineBreakClass }, //BUGINESE VOWEL SIGN I
+ { 0x1a1e, 0x1a1f, MLineBreaker::EBaLineBreakClass }, //BUGINESE PALLAWA
+ { 0x1a1f, 0x1a20, MLineBreaker::EAlLineBreakClass }, //BUGINESE END OF SECTION
+ { 0x1b00, 0x1b05, MLineBreaker::ECmLineBreakClass }, //BALINESE SIGN ULU RICEM
+ { 0x1b05, 0x1b34, MLineBreaker::EAlLineBreakClass }, //BALINESE LETTER AKARA
+ { 0x1b34, 0x1b45, MLineBreaker::ECmLineBreakClass }, //BALINESE SIGN REREKAN
+ { 0x1b45, 0x1b4c, MLineBreaker::EAlLineBreakClass }, //BALINESE LETTER KAF SASAK
+ { 0x1b50, 0x1b5a, MLineBreaker::ENuLineBreakClass }, //BALINESE DIGIT ZERO
+ { 0x1b5a, 0x1b61, MLineBreaker::EBaLineBreakClass }, //BALINESE PANTI
+ { 0x1b61, 0x1b6b, MLineBreaker::EAlLineBreakClass }, //BALINESE MUSICAL SYMBOL DONG
+ { 0x1b6b, 0x1b74, MLineBreaker::ECmLineBreakClass }, //BALINESE MUSICAL SYMBOL COMBINING TEGEH
+ { 0x1b74, 0x1b7d, MLineBreaker::EAlLineBreakClass }, //BALINESE MUSICAL SYMBOL RIGHT-HAND OPEN DUG
+ { 0x1d00, 0x1dc0, MLineBreaker::EAlLineBreakClass }, //LATIN LETTER SMALL CAPITAL A
+ { 0x1dc0, 0x1dcb, MLineBreaker::ECmLineBreakClass }, //COMBINING DOTTED GRAVE ACCENT
+ { 0x1dfe, 0x1e00, MLineBreaker::ECmLineBreakClass }, //COMBINING LEFT ARROWHEAD ABOVE
+ { 0x1e00, 0x1e9c, MLineBreaker::EAlLineBreakClass }, //latin capital letter a with ring below
+ { 0x1ea0, 0x1efa, MLineBreaker::EAlLineBreakClass }, //latin capital letter a with dot below
+ { 0x1f00, 0x1f16, MLineBreaker::EAlLineBreakClass }, //greek small letter alpha with psili
+ { 0x1f18, 0x1f1e, MLineBreaker::EAlLineBreakClass }, //greek capital letter epsilon with psili
+ { 0x1f20, 0x1f46, MLineBreaker::EAlLineBreakClass }, //greek small letter eta with psili
+ { 0x1f48, 0x1f4e, MLineBreaker::EAlLineBreakClass }, //greek capital letter omicron with psili
+ { 0x1f50, 0x1f58, MLineBreaker::EAlLineBreakClass }, //greek small letter upsilon with psili
+ { 0x1f59, 0x1f5a, MLineBreaker::EAlLineBreakClass }, //greek capital letter upsilon with dasia
+ { 0x1f5b, 0x1f5c, MLineBreaker::EAlLineBreakClass }, //greek capital letter upsilon with dasia and varia
+ { 0x1f5d, 0x1f5e, MLineBreaker::EAlLineBreakClass }, //greek capital letter upsilon with dasia and oxia
+ { 0x1f5f, 0x1f7e, MLineBreaker::EAlLineBreakClass }, //greek capital letter upsilon with dasia and perispomeni
+ { 0x1f80, 0x1fb5, MLineBreaker::EAlLineBreakClass }, //greek small letter alpha with psili and ypogegrammeni
+ { 0x1fb6, 0x1fc5, MLineBreaker::EAlLineBreakClass }, //greek small letter alpha with perispomeni
+ { 0x1fc6, 0x1fd4, MLineBreaker::EAlLineBreakClass }, //greek small letter eta with perispomeni
+ { 0x1fd6, 0x1fdc, MLineBreaker::EAlLineBreakClass }, //greek small letter iota with perispomeni
+ { 0x1fdd, 0x1ff0, MLineBreaker::EAlLineBreakClass }, //greek dasia and varia
+ { 0x1ff2, 0x1ff5, MLineBreaker::EAlLineBreakClass }, //greek small letter omega with varia and ypogegrammeni
+ { 0x1ff6, 0x1fff, MLineBreaker::EAlLineBreakClass }, //greek small letter omega with perispomeni
+ { 0x2000, 0x2007, MLineBreaker::EBaLineBreakClass }, //en quad
+ { 0x2007, 0x2008, MLineBreaker::EGlLineBreakClass }, //figure space
+ { 0x2008, 0x200b, MLineBreaker::EBaLineBreakClass }, //punctuation space
+ { 0x200b, 0x200c, MLineBreaker::EZwLineBreakClass }, //zero width space
+ { 0x200c, 0x2010, MLineBreaker::ECmLineBreakClass }, //zero width non-joiner
+ { 0x2010, 0x2011, MLineBreaker::EBaLineBreakClass }, //hyphen
+ { 0x2011, 0x2012, MLineBreaker::EGlLineBreakClass }, //non-breaking hyphen
+ { 0x2012, 0x2014, MLineBreaker::EBaLineBreakClass }, //figure dash
+ { 0x2014, 0x2015, MLineBreaker::EB2LineBreakClass }, //em dash
+ { 0x2015, 0x2016, MLineBreaker::EAlLineBreakClass }, //horizontal bar
+ { 0x2016, 0x2017, MLineBreaker::EAiLineBreakClass }, //double vertical line
+ { 0x2017, 0x2018, MLineBreaker::EAlLineBreakClass }, //double low line
+ { 0x2018, 0x201a, MLineBreaker::EQuLineBreakClass }, //left single quotation mark
+ { 0x201a, 0x201b, MLineBreaker::EOpLineBreakClass }, //single low-9 quotation mark
+ { 0x201b, 0x201e, MLineBreaker::EQuLineBreakClass }, //single high-reversed-9 quotation mark
+ { 0x201e, 0x201f, MLineBreaker::EOpLineBreakClass }, //double low-9 quotation mark
+ { 0x201f, 0x2020, MLineBreaker::EQuLineBreakClass }, //double high-reversed-9 quotation mark
+ { 0x2020, 0x2022, MLineBreaker::EAiLineBreakClass }, //dagger
+ { 0x2022, 0x2024, MLineBreaker::EAlLineBreakClass }, //bullet
+ { 0x2024, 0x2027, MLineBreaker::EInLineBreakClass }, //one dot leader
+ { 0x2027, 0x2028, MLineBreaker::EBaLineBreakClass }, //hyphenation point
+ { 0x2028, 0x202a, MLineBreaker::EBkLineBreakClass }, //line separator
+ { 0x202a, 0x202f, MLineBreaker::ECmLineBreakClass }, //left-to-right embedding
+ { 0x202f, 0x2030, MLineBreaker::EGlLineBreakClass }, //narrow no-break space
+ { 0x2030, 0x2038, MLineBreaker::EPoLineBreakClass }, //per mille sign
+ { 0x2038, 0x2039, MLineBreaker::EAlLineBreakClass }, //caret
+ { 0x2039, 0x203b, MLineBreaker::EQuLineBreakClass }, //single left-pointing angle quotation mark
+ { 0x203b, 0x203c, MLineBreaker::EAiLineBreakClass }, //reference mark
+ { 0x203c, 0x203d, MLineBreaker::ENsLineBreakClass }, //double exclamation mark
+ { 0x203d, 0x2044, MLineBreaker::EAlLineBreakClass }, //interrobang
+ { 0x2044, 0x2045, MLineBreaker::ENsLineBreakClass }, //fraction slash
+ { 0x2045, 0x2046, MLineBreaker::EOpLineBreakClass }, //left square bracket with quill
+ { 0x2046, 0x2047, MLineBreaker::EClLineBreakClass }, //right square bracket with quill
+ { 0x2047, 0x2048, MLineBreaker::ENsLineBreakClass }, //DOUBLE QUESTION MARK
+ { 0x2048, 0x2056, MLineBreaker::EAlLineBreakClass }, //question exclamation mark
+ { 0x2056, 0x2057, MLineBreaker::EBaLineBreakClass }, //THREE DOT PUNCTUATION
+ { 0x2057, 0x2058, MLineBreaker::EAlLineBreakClass }, //QUADRUPLE PRIME
+ { 0x2058, 0x205c, MLineBreaker::EBaLineBreakClass }, //FOUR DOT PUNCTUATION
+ { 0x205c, 0x205d, MLineBreaker::EAlLineBreakClass }, //DOTTED CROSS
+ { 0x205d, 0x2060, MLineBreaker::EBaLineBreakClass }, //TRICOLON
+ { 0x2060, 0x2061, MLineBreaker::EGlLineBreakClass }, //WORD JOINER
+ { 0x2061, 0x2064, MLineBreaker::EAlLineBreakClass }, //FUNCTION APPLICATION
+ { 0x206a, 0x2070, MLineBreaker::ECmLineBreakClass }, //inhibit symmetric swapping
+ { 0x2070, 0x2071, MLineBreaker::EAlLineBreakClass }, //superscript zero
+ { 0x2071, 0x2072, MLineBreaker::EAlLineBreakClass }, //SUPERSCRIPT LATIN SMALL LETTER I
+ { 0x2074, 0x2075, MLineBreaker::EAiLineBreakClass }, //superscript four
+ { 0x2075, 0x207d, MLineBreaker::EAlLineBreakClass }, //superscript five
+ { 0x207d, 0x207e, MLineBreaker::EOpLineBreakClass }, //superscript left parenthesis
+ { 0x207e, 0x207f, MLineBreaker::EClLineBreakClass }, //superscript right parenthesis
+ { 0x207f, 0x2080, MLineBreaker::EAiLineBreakClass }, //superscript latin small letter n
+ { 0x2080, 0x2081, MLineBreaker::EAlLineBreakClass }, //subscript zero
+ { 0x2081, 0x2085, MLineBreaker::EAiLineBreakClass }, //subscript one
+ { 0x2085, 0x208d, MLineBreaker::EAlLineBreakClass }, //subscript five
+ { 0x208d, 0x208e, MLineBreaker::EOpLineBreakClass }, //subscript left parenthesis
+ { 0x208e, 0x208f, MLineBreaker::EClLineBreakClass }, //subscript right parenthesis
+ { 0x2090, 0x2095, MLineBreaker::EAlLineBreakClass }, //LATIN SUBSCRIPT SMALL LETTER A
+ { 0x20a0, 0x20a7, MLineBreaker::EPrLineBreakClass }, //euro-currency sign
+ { 0x20a7, 0x20a8, MLineBreaker::EPoLineBreakClass }, //peseta sign
+ { 0x20a8, 0x20b6, MLineBreaker::EPrLineBreakClass }, //rupee sign
+ { 0x20d0, 0x20f0, MLineBreaker::ECmLineBreakClass }, //combining left harpoon above
+ { 0x2100, 0x2103, MLineBreaker::EAlLineBreakClass }, //account of
+ { 0x2103, 0x2104, MLineBreaker::EPoLineBreakClass }, //degree celsius
+ { 0x2104, 0x2105, MLineBreaker::EAlLineBreakClass }, //centre line symbol
+ { 0x2105, 0x2106, MLineBreaker::EAiLineBreakClass }, //care of
+ { 0x2106, 0x2109, MLineBreaker::EAlLineBreakClass }, //cada una
+ { 0x2109, 0x210a, MLineBreaker::EPoLineBreakClass }, //degree fahrenheit
+ { 0x210a, 0x2113, MLineBreaker::EAlLineBreakClass }, //script small g
+ { 0x2113, 0x2114, MLineBreaker::EAiLineBreakClass }, //script small l
+ { 0x2114, 0x2116, MLineBreaker::EAlLineBreakClass }, //l b bar symbol
+ { 0x2116, 0x2117, MLineBreaker::EPrLineBreakClass }, //numero sign
+ { 0x2117, 0x2121, MLineBreaker::EAlLineBreakClass }, //sound recording copyright
+ { 0x2121, 0x2123, MLineBreaker::EAiLineBreakClass }, //telephone sign
+ { 0x2123, 0x2126, MLineBreaker::EAlLineBreakClass }, //versicle
+ { 0x2126, 0x2127, MLineBreaker::EPoLineBreakClass }, //ohm sign
+ { 0x2127, 0x212b, MLineBreaker::EAlLineBreakClass }, //inverted ohm sign
+ { 0x212b, 0x212c, MLineBreaker::EAiLineBreakClass }, //angstrom sign
+ { 0x212c, 0x214f, MLineBreaker::EAlLineBreakClass }, //script capital b
+ { 0x2153, 0x2154, MLineBreaker::EAlLineBreakClass }, //vulgar fraction one third
+ { 0x2154, 0x2156, MLineBreaker::EAiLineBreakClass }, //vulgar fraction two thirds
+ { 0x2156, 0x215b, MLineBreaker::EAlLineBreakClass }, //vulgar fraction two fifths
+ { 0x215b, 0x215c, MLineBreaker::EAiLineBreakClass }, //vulgar fraction one eighth
+ { 0x215c, 0x215e, MLineBreaker::EAlLineBreakClass }, //vulgar fraction three eighths
+ { 0x215e, 0x215f, MLineBreaker::EAiLineBreakClass }, //vulgar fraction seven eighths
+ { 0x215f, 0x2160, MLineBreaker::EAlLineBreakClass }, //fraction numerator one
+ { 0x2160, 0x216c, MLineBreaker::EAiLineBreakClass }, //roman numeral one
+ { 0x216c, 0x2170, MLineBreaker::EAlLineBreakClass }, //roman numeral fifty
+ { 0x2170, 0x217a, MLineBreaker::EAiLineBreakClass }, //small roman numeral one
+ { 0x217a, 0x2185, MLineBreaker::EAlLineBreakClass }, //small roman numeral eleven
+ { 0x2190, 0x219a, MLineBreaker::EAiLineBreakClass }, //leftwards arrow
+ { 0x219a, 0x21d2, MLineBreaker::EAlLineBreakClass }, //leftwards arrow with stroke
+ { 0x21d2, 0x21d3, MLineBreaker::EAiLineBreakClass }, //rightwards double arrow
+ { 0x21d3, 0x21d4, MLineBreaker::EAlLineBreakClass }, //downwards double arrow
+ { 0x21d4, 0x21d5, MLineBreaker::EAiLineBreakClass }, //left right double arrow
+ { 0x21d5, 0x2200, MLineBreaker::EAlLineBreakClass }, //up down double arrow
+ { 0x2200, 0x2201, MLineBreaker::EAiLineBreakClass }, //for all
+ { 0x2201, 0x2202, MLineBreaker::EAlLineBreakClass }, //complement
+ { 0x2202, 0x2204, MLineBreaker::EAiLineBreakClass }, //partial differential
+ { 0x2204, 0x2207, MLineBreaker::EAlLineBreakClass }, //there does not exist
+ { 0x2207, 0x2209, MLineBreaker::EAiLineBreakClass }, //nabla
+ { 0x2209, 0x220b, MLineBreaker::EAlLineBreakClass }, //not an element of
+ { 0x220b, 0x220c, MLineBreaker::EAiLineBreakClass }, //contains as member
+ { 0x220c, 0x220f, MLineBreaker::EAlLineBreakClass }, //does not contain as member
+ { 0x220f, 0x2210, MLineBreaker::EAiLineBreakClass }, //n-ary product
+ { 0x2210, 0x2211, MLineBreaker::EAlLineBreakClass }, //n-ary coproduct
+ { 0x2211, 0x2212, MLineBreaker::EAiLineBreakClass }, //n-ary summation
+ { 0x2212, 0x2214, MLineBreaker::EPrLineBreakClass }, //minus sign
+ { 0x2214, 0x2215, MLineBreaker::EAlLineBreakClass }, //dot plus
+ { 0x2215, 0x2216, MLineBreaker::EAiLineBreakClass }, //division slash
+ { 0x2216, 0x221a, MLineBreaker::EAlLineBreakClass }, //set minus
+ { 0x221a, 0x221b, MLineBreaker::EAiLineBreakClass }, //square root
+ { 0x221b, 0x221d, MLineBreaker::EAlLineBreakClass }, //cube root
+ { 0x221d, 0x2221, MLineBreaker::EAiLineBreakClass }, //proportional to
+ { 0x2221, 0x2223, MLineBreaker::EAlLineBreakClass }, //measured angle
+ { 0x2223, 0x2224, MLineBreaker::EAiLineBreakClass }, //divides
+ { 0x2224, 0x2225, MLineBreaker::EAlLineBreakClass }, //does not divide
+ { 0x2225, 0x2226, MLineBreaker::EAiLineBreakClass }, //parallel to
+ { 0x2226, 0x2227, MLineBreaker::EAlLineBreakClass }, //not parallel to
+ { 0x2227, 0x222d, MLineBreaker::EAiLineBreakClass }, //logical and
+ { 0x222d, 0x222e, MLineBreaker::EAlLineBreakClass }, //triple integral
+ { 0x222e, 0x222f, MLineBreaker::EAiLineBreakClass }, //contour integral
+ { 0x222f, 0x2234, MLineBreaker::EAlLineBreakClass }, //surface integral
+ { 0x2234, 0x2238, MLineBreaker::EAiLineBreakClass }, //therefore
+ { 0x2238, 0x223c, MLineBreaker::EAlLineBreakClass }, //dot minus
+ { 0x223c, 0x223e, MLineBreaker::EAiLineBreakClass }, //tilde operator
+ { 0x223e, 0x2248, MLineBreaker::EAlLineBreakClass }, //inverted lazy s
+ { 0x2248, 0x2249, MLineBreaker::EAiLineBreakClass }, //almost equal to
+ { 0x2249, 0x224c, MLineBreaker::EAlLineBreakClass }, //not almost equal to
+ { 0x224c, 0x224d, MLineBreaker::EAiLineBreakClass }, //all equal to
+ { 0x224d, 0x2252, MLineBreaker::EAlLineBreakClass }, //equivalent to
+ { 0x2252, 0x2253, MLineBreaker::EAiLineBreakClass }, //approximately equal to or the image of
+ { 0x2253, 0x2260, MLineBreaker::EAlLineBreakClass }, //image of or approximately equal to
+ { 0x2260, 0x2262, MLineBreaker::EAiLineBreakClass }, //not equal to
+ { 0x2262, 0x2264, MLineBreaker::EAlLineBreakClass }, //not identical to
+ { 0x2264, 0x2268, MLineBreaker::EAiLineBreakClass }, //less-than or equal to
+ { 0x2268, 0x226a, MLineBreaker::EAlLineBreakClass }, //less-than but not equal to
+ { 0x226a, 0x226c, MLineBreaker::EAiLineBreakClass }, //much less-than
+ { 0x226c, 0x226e, MLineBreaker::EAlLineBreakClass }, //between
+ { 0x226e, 0x2270, MLineBreaker::EAiLineBreakClass }, //not less-than
+ { 0x2270, 0x2282, MLineBreaker::EAlLineBreakClass }, //neither less-than nor equal to
+ { 0x2282, 0x2284, MLineBreaker::EAiLineBreakClass }, //subset of
+ { 0x2284, 0x2286, MLineBreaker::EAlLineBreakClass }, //not a subset of
+ { 0x2286, 0x2288, MLineBreaker::EAiLineBreakClass }, //subset of or equal to
+ { 0x2288, 0x2295, MLineBreaker::EAlLineBreakClass }, //neither a subset of nor equal to
+ { 0x2295, 0x2296, MLineBreaker::EAiLineBreakClass }, //circled plus
+ { 0x2296, 0x2299, MLineBreaker::EAlLineBreakClass }, //circled minus
+ { 0x2299, 0x229a, MLineBreaker::EAiLineBreakClass }, //circled dot operator
+ { 0x229a, 0x22a5, MLineBreaker::EAlLineBreakClass }, //circled ring operator
+ { 0x22a5, 0x22a6, MLineBreaker::EAiLineBreakClass }, //up tack
+ { 0x22a6, 0x22bf, MLineBreaker::EAlLineBreakClass }, //assertion
+ { 0x22bf, 0x22c0, MLineBreaker::EAiLineBreakClass }, //right triangle
+ { 0x22c0, 0x2312, MLineBreaker::EAlLineBreakClass }, //n-ary logical and
+ { 0x2312, 0x2313, MLineBreaker::EAiLineBreakClass }, //arc
+ { 0x2313, 0x2329, MLineBreaker::EAlLineBreakClass }, //segment
+ { 0x2329, 0x232a, MLineBreaker::EOpLineBreakClass }, //left-pointing angle bracket
+ { 0x232a, 0x232b, MLineBreaker::EClLineBreakClass }, //right-pointing angle bracket
+ { 0x232b, 0x23e8, MLineBreaker::EAlLineBreakClass }, //erase to the left
+ { 0x2400, 0x2427, MLineBreaker::EAlLineBreakClass }, //symbol for null
+ { 0x2440, 0x244b, MLineBreaker::EAlLineBreakClass }, //ocr hook
+ { 0x2460, 0x24c0, MLineBreaker::EAiLineBreakClass }, //circled digit one
+ { 0x24c0, 0x24d0, MLineBreaker::EAlLineBreakClass }, //circled latin capital letter k
+ { 0x24d0, 0x24ea, MLineBreaker::EAiLineBreakClass }, //circled latin small letter a
+ { 0x24ea, 0x24eb, MLineBreaker::EAlLineBreakClass }, //circled digit zero
+ { 0x24eb, 0x24ff, MLineBreaker::EAiLineBreakClass }, //NEGATIVE CIRCLED NUMBER ELEVEN
+ { 0x24ff, 0x2500, MLineBreaker::EAlLineBreakClass }, //NEGATIVE CIRCLED DIGIT ZERO
+ { 0x2500, 0x254c, MLineBreaker::EAiLineBreakClass }, //box drawings light horizontal
+ { 0x254c, 0x2550, MLineBreaker::EAlLineBreakClass }, //box drawings light double dash horizontal
+ { 0x2550, 0x2575, MLineBreaker::EAiLineBreakClass }, //box drawings double horizontal
+ { 0x2575, 0x2580, MLineBreaker::EAlLineBreakClass }, //box drawings light up
+ { 0x2580, 0x2590, MLineBreaker::EAiLineBreakClass }, //upper half block
+ { 0x2590, 0x2592, MLineBreaker::EAlLineBreakClass }, //right half block
+ { 0x2592, 0x2596, MLineBreaker::EAiLineBreakClass }, //medium shade
+ { 0x2596, 0x25a0, MLineBreaker::EAlLineBreakClass }, //QUADRANT LOWER LEFT
+ { 0x25a0, 0x25a2, MLineBreaker::EAiLineBreakClass }, //black square
+ { 0x25a2, 0x25a3, MLineBreaker::EAlLineBreakClass }, //white square with rounded corners
+ { 0x25a3, 0x25aa, MLineBreaker::EAiLineBreakClass }, //white square containing black small square
+ { 0x25aa, 0x25b2, MLineBreaker::EAlLineBreakClass }, //black small square
+ { 0x25b2, 0x25b4, MLineBreaker::EAiLineBreakClass }, //black up-pointing triangle
+ { 0x25b4, 0x25b6, MLineBreaker::EAlLineBreakClass }, //black up-pointing small triangle
+ { 0x25b6, 0x25b8, MLineBreaker::EAiLineBreakClass }, //black right-pointing triangle
+ { 0x25b8, 0x25bc, MLineBreaker::EAlLineBreakClass }, //black right-pointing small triangle
+ { 0x25bc, 0x25be, MLineBreaker::EAiLineBreakClass }, //black down-pointing triangle
+ { 0x25be, 0x25c0, MLineBreaker::EAlLineBreakClass }, //black down-pointing small triangle
+ { 0x25c0, 0x25c2, MLineBreaker::EAiLineBreakClass }, //black left-pointing triangle
+ { 0x25c2, 0x25c6, MLineBreaker::EAlLineBreakClass }, //black left-pointing small triangle
+ { 0x25c6, 0x25c8, MLineBreaker::EAiLineBreakClass }, //black diamond
+ { 0x25c8, 0x25cb, MLineBreaker::EAlLineBreakClass }, //white diamond containing black small diamond
+ { 0x25cb, 0x25cc, MLineBreaker::EAiLineBreakClass }, //white circle
+ { 0x25cc, 0x25ce, MLineBreaker::EAlLineBreakClass }, //dotted circle
+ { 0x25ce, 0x25d2, MLineBreaker::EAiLineBreakClass }, //bullseye
+ { 0x25d2, 0x25e2, MLineBreaker::EAlLineBreakClass }, //circle with lower half black
+ { 0x25e2, 0x25e6, MLineBreaker::EAiLineBreakClass }, //black lower right triangle
+ { 0x25e6, 0x25ef, MLineBreaker::EAlLineBreakClass }, //white bullet
+ { 0x25ef, 0x25f0, MLineBreaker::EAiLineBreakClass }, //large circle
+ { 0x25f0, 0x2605, MLineBreaker::EAlLineBreakClass }, //white square with upper left quadrant
+ { 0x2605, 0x2607, MLineBreaker::EAiLineBreakClass }, //black star
+ { 0x2607, 0x2609, MLineBreaker::EAlLineBreakClass }, //lightning
+ { 0x2609, 0x260a, MLineBreaker::EAiLineBreakClass }, //sun
+ { 0x260a, 0x260e, MLineBreaker::EAlLineBreakClass }, //ascending node
+ { 0x260e, 0x2610, MLineBreaker::EAiLineBreakClass }, //black telephone
+ { 0x2610, 0x2614, MLineBreaker::EAlLineBreakClass }, //ballot box
+ { 0x2614, 0x2618, MLineBreaker::EAiLineBreakClass }, //UMBRELLA WITH RAIN DROPS
+ { 0x2618, 0x261c, MLineBreaker::EAlLineBreakClass }, //SHAMROCK
+ { 0x261c, 0x261d, MLineBreaker::EAiLineBreakClass }, //white left pointing index
+ { 0x261d, 0x261e, MLineBreaker::EAlLineBreakClass }, //white up pointing index
+ { 0x261e, 0x261f, MLineBreaker::EAiLineBreakClass }, //white right pointing index
+ { 0x261f, 0x2640, MLineBreaker::EAlLineBreakClass }, //white down pointing index
+ { 0x2640, 0x2641, MLineBreaker::EAiLineBreakClass }, //female sign
+ { 0x2641, 0x2642, MLineBreaker::EAlLineBreakClass }, //earth
+ { 0x2642, 0x2643, MLineBreaker::EAiLineBreakClass }, //male sign
+ { 0x2643, 0x2660, MLineBreaker::EAlLineBreakClass }, //jupiter
+ { 0x2660, 0x2662, MLineBreaker::EAiLineBreakClass }, //black spade suit
+ { 0x2662, 0x2663, MLineBreaker::EAlLineBreakClass }, //white diamond suit
+ { 0x2663, 0x2666, MLineBreaker::EAiLineBreakClass }, //black club suit
+ { 0x2666, 0x2667, MLineBreaker::EAlLineBreakClass }, //black diamond suit
+ { 0x2667, 0x266b, MLineBreaker::EAiLineBreakClass }, //white club suit
+ { 0x266b, 0x266c, MLineBreaker::EAlLineBreakClass }, //beamed eighth notes
+ { 0x266c, 0x266e, MLineBreaker::EAiLineBreakClass }, //beamed sixteenth notes
+ { 0x266e, 0x266f, MLineBreaker::EAlLineBreakClass }, //music natural sign
+ { 0x266f, 0x2670, MLineBreaker::EAiLineBreakClass }, //music sharp sign
+ { 0x2670, 0x269d, MLineBreaker::EAlLineBreakClass }, //west syriac cross
+ { 0x26a0, 0x26b3, MLineBreaker::EAlLineBreakClass }, //WARNING SIGN
+ { 0x2701, 0x2705, MLineBreaker::EAlLineBreakClass }, //upper blade scissors
+ { 0x2706, 0x270a, MLineBreaker::EAlLineBreakClass }, //telephone location sign
+ { 0x270c, 0x2728, MLineBreaker::EAlLineBreakClass }, //victory hand
+ { 0x2729, 0x274c, MLineBreaker::EAlLineBreakClass }, //stress outlined white star
+ { 0x274d, 0x274e, MLineBreaker::EAlLineBreakClass }, //shadowed white circle
+ { 0x274f, 0x2753, MLineBreaker::EAlLineBreakClass }, //lower right drop-shadowed white square
+ { 0x2756, 0x2757, MLineBreaker::EAlLineBreakClass }, //black diamond minus white x
+ { 0x2758, 0x275f, MLineBreaker::EAlLineBreakClass }, //light vertical bar
+ { 0x2761, 0x2768, MLineBreaker::EAlLineBreakClass }, //curved stem paragraph sign ornament
+ { 0x2768, 0x2769, MLineBreaker::EOpLineBreakClass }, //MEDIUM LEFT PARENTHESIS ORNAMENT
+ { 0x2769, 0x276a, MLineBreaker::EClLineBreakClass }, //MEDIUM RIGHT PARENTHESIS ORNAMENT
+ { 0x276a, 0x276b, MLineBreaker::EOpLineBreakClass }, //MEDIUM FLATTENED LEFT PARENTHESIS ORNAMENT
+ { 0x276b, 0x276c, MLineBreaker::EClLineBreakClass }, //MEDIUM FLATTENED RIGHT PARENTHESIS ORNAMENT
+ { 0x276c, 0x276d, MLineBreaker::EOpLineBreakClass }, //MEDIUM LEFT-POINTING ANGLE BRACKET ORNAMENT
+ { 0x276d, 0x276e, MLineBreaker::EClLineBreakClass }, //MEDIUM RIGHT-POINTING ANGLE BRACKET ORNAMENT
+ { 0x276e, 0x276f, MLineBreaker::EOpLineBreakClass }, //HEAVY LEFT-POINTING ANGLE QUOTATION MARK ORNAMENT
+ { 0x276f, 0x2770, MLineBreaker::EClLineBreakClass }, //HEAVY RIGHT-POINTING ANGLE QUOTATION MARK ORNAMENT
+ { 0x2770, 0x2771, MLineBreaker::EOpLineBreakClass }, //HEAVY LEFT-POINTING ANGLE BRACKET ORNAMENT
+ { 0x2771, 0x2772, MLineBreaker::EClLineBreakClass }, //HEAVY RIGHT-POINTING ANGLE BRACKET ORNAMENT
+ { 0x2772, 0x2773, MLineBreaker::EOpLineBreakClass }, //LIGHT LEFT TORTOISE SHELL BRACKET ORNAMENT
+ { 0x2773, 0x2774, MLineBreaker::EClLineBreakClass }, //LIGHT RIGHT TORTOISE SHELL BRACKET ORNAMENT
+ { 0x2774, 0x2775, MLineBreaker::EOpLineBreakClass }, //MEDIUM LEFT CURLY BRACKET ORNAMENT
+ { 0x2775, 0x2776, MLineBreaker::EClLineBreakClass }, //MEDIUM RIGHT CURLY BRACKET ORNAMENT
+ { 0x2776, 0x2795, MLineBreaker::EAlLineBreakClass }, //dingbat negative circled digit one
+ { 0x2798, 0x27b0, MLineBreaker::EAlLineBreakClass }, //heavy south east arrow
+ { 0x27b1, 0x27bf, MLineBreaker::EAlLineBreakClass }, //notched upper right-shadowed white rightwards arrow
+ { 0x27c0, 0x27c5, MLineBreaker::EAlLineBreakClass }, //THREE DIMENSIONAL ANGLE
+ { 0x27c5, 0x27c6, MLineBreaker::EOpLineBreakClass }, //LEFT S-SHAPED BAG DELIMITER
+ { 0x27c6, 0x27c7, MLineBreaker::EClLineBreakClass }, //RIGHT S-SHAPED BAG DELIMITER
+ { 0x27c7, 0x27cb, MLineBreaker::EAlLineBreakClass }, //OR WITH DOT INSIDE
+ { 0x27d0, 0x27e6, MLineBreaker::EAlLineBreakClass }, //WHITE DIAMOND WITH CENTRED DOT
+ { 0x27e6, 0x27e7, MLineBreaker::EOpLineBreakClass }, //MATHEMATICAL LEFT WHITE SQUARE BRACKET
+ { 0x27e7, 0x27e8, MLineBreaker::EClLineBreakClass }, //MATHEMATICAL RIGHT WHITE SQUARE BRACKET
+ { 0x27e8, 0x27e9, MLineBreaker::EOpLineBreakClass }, //MATHEMATICAL LEFT ANGLE BRACKET
+ { 0x27e9, 0x27ea, MLineBreaker::EClLineBreakClass }, //MATHEMATICAL RIGHT ANGLE BRACKET
+ { 0x27ea, 0x27eb, MLineBreaker::EOpLineBreakClass }, //MATHEMATICAL LEFT DOUBLE ANGLE BRACKET
+ { 0x27eb, 0x27ec, MLineBreaker::EClLineBreakClass }, //MATHEMATICAL RIGHT DOUBLE ANGLE BRACKET
+ { 0x27f0, 0x2983, MLineBreaker::EAlLineBreakClass }, //UPWARDS QUADRUPLE ARROW
+ { 0x2983, 0x2984, MLineBreaker::EOpLineBreakClass }, //LEFT WHITE CURLY BRACKET
+ { 0x2984, 0x2985, MLineBreaker::EClLineBreakClass }, //RIGHT WHITE CURLY BRACKET
+ { 0x2985, 0x2986, MLineBreaker::EOpLineBreakClass }, //LEFT WHITE PARENTHESIS
+ { 0x2986, 0x2987, MLineBreaker::EClLineBreakClass }, //RIGHT WHITE PARENTHESIS
+ { 0x2987, 0x2988, MLineBreaker::EOpLineBreakClass }, //Z NOTATION LEFT IMAGE BRACKET
+ { 0x2988, 0x2989, MLineBreaker::EClLineBreakClass }, //Z NOTATION RIGHT IMAGE BRACKET
+ { 0x2989, 0x298a, MLineBreaker::EOpLineBreakClass }, //Z NOTATION LEFT BINDING BRACKET
+ { 0x298a, 0x298b, MLineBreaker::EClLineBreakClass }, //Z NOTATION RIGHT BINDING BRACKET
+ { 0x298b, 0x298c, MLineBreaker::EOpLineBreakClass }, //LEFT SQUARE BRACKET WITH UNDERBAR
+ { 0x298c, 0x298d, MLineBreaker::EClLineBreakClass }, //RIGHT SQUARE BRACKET WITH UNDERBAR
+ { 0x298d, 0x298e, MLineBreaker::EOpLineBreakClass }, //LEFT SQUARE BRACKET WITH TICK IN TOP CORNER
+ { 0x298e, 0x298f, MLineBreaker::EClLineBreakClass }, //RIGHT SQUARE BRACKET WITH TICK IN BOTTOM CORNER
+ { 0x298f, 0x2990, MLineBreaker::EOpLineBreakClass }, //LEFT SQUARE BRACKET WITH TICK IN BOTTOM CORNER
+ { 0x2990, 0x2991, MLineBreaker::EClLineBreakClass }, //RIGHT SQUARE BRACKET WITH TICK IN TOP CORNER
+ { 0x2991, 0x2992, MLineBreaker::EOpLineBreakClass }, //LEFT ANGLE BRACKET WITH DOT
+ { 0x2992, 0x2993, MLineBreaker::EClLineBreakClass }, //RIGHT ANGLE BRACKET WITH DOT
+ { 0x2993, 0x2994, MLineBreaker::EOpLineBreakClass }, //LEFT ARC LESS-THAN BRACKET
+ { 0x2994, 0x2995, MLineBreaker::EClLineBreakClass }, //RIGHT ARC GREATER-THAN BRACKET
+ { 0x2995, 0x2996, MLineBreaker::EOpLineBreakClass }, //DOUBLE LEFT ARC GREATER-THAN BRACKET
+ { 0x2996, 0x2997, MLineBreaker::EClLineBreakClass }, //DOUBLE RIGHT ARC LESS-THAN BRACKET
+ { 0x2997, 0x2998, MLineBreaker::EOpLineBreakClass }, //LEFT BLACK TORTOISE SHELL BRACKET
+ { 0x2998, 0x2999, MLineBreaker::EClLineBreakClass }, //RIGHT BLACK TORTOISE SHELL BRACKET
+ { 0x2999, 0x29d8, MLineBreaker::EAlLineBreakClass }, //DOTTED FENCE
+ { 0x29d8, 0x29d9, MLineBreaker::EOpLineBreakClass }, //LEFT WIGGLY FENCE
+ { 0x29d9, 0x29da, MLineBreaker::EClLineBreakClass }, //RIGHT WIGGLY FENCE
+ { 0x29da, 0x29db, MLineBreaker::EOpLineBreakClass }, //LEFT DOUBLE WIGGLY FENCE
+ { 0x29db, 0x29dc, MLineBreaker::EClLineBreakClass }, //RIGHT DOUBLE WIGGLY FENCE
+ { 0x29dc, 0x29fc, MLineBreaker::EAlLineBreakClass }, //INCOMPLETE INFINITY
+ { 0x29fc, 0x29fd, MLineBreaker::EOpLineBreakClass }, //LEFT-POINTING CURVED ANGLE BRACKET
+ { 0x29fd, 0x29fe, MLineBreaker::EClLineBreakClass }, //RIGHT-POINTING CURVED ANGLE BRACKET
+ { 0x29fe, 0x2b1b, MLineBreaker::EAlLineBreakClass }, //TINY
+ { 0x2b20, 0x2b24, MLineBreaker::EAlLineBreakClass }, //WHITE PENTAGON
+ { 0x2c00, 0x2c2f, MLineBreaker::EAlLineBreakClass }, //GLAGOLITIC CAPITAL LETTER AZU
+ { 0x2c30, 0x2c5f, MLineBreaker::EAlLineBreakClass }, //GLAGOLITIC SMALL LETTER AZU
+ { 0x2c60, 0x2c6d, MLineBreaker::EAlLineBreakClass }, //LATIN CAPITAL LETTER L WITH DOUBLE BAR
+ { 0x2c74, 0x2c78, MLineBreaker::EAlLineBreakClass }, //LATIN SMALL LETTER V WITH CURL
+ { 0x2c80, 0x2ceb, MLineBreaker::EAlLineBreakClass }, //COPTIC CAPITAL LETTER ALFA
+ { 0x2cf9, 0x2cfd, MLineBreaker::EBaLineBreakClass }, //COPTIC OLD NUBIAN FULL STOP
+ { 0x2cfd, 0x2cfe, MLineBreaker::EAlLineBreakClass }, //COPTIC FRACTION ONE HALF
+ { 0x2cfe, 0x2d00, MLineBreaker::EBaLineBreakClass }, //COPTIC FULL STOP
+ { 0x2d00, 0x2d26, MLineBreaker::EAlLineBreakClass }, //GEORGIAN SMALL LETTER AN
+ { 0x2d30, 0x2d66, MLineBreaker::EAlLineBreakClass }, //TIFINAGH LETTER YA
+ { 0x2d6f, 0x2d70, MLineBreaker::EAlLineBreakClass }, //TIFINAGH MODIFIER LETTER LABIALIZATION MARK
+ { 0x2d80, 0x2d97, MLineBreaker::EAlLineBreakClass }, //ETHIOPIC SYLLABLE LOA
+ { 0x2da0, 0x2da7, MLineBreaker::EAlLineBreakClass }, //ETHIOPIC SYLLABLE SSA
+ { 0x2da8, 0x2daf, MLineBreaker::EAlLineBreakClass }, //ETHIOPIC SYLLABLE CCA
+ { 0x2db0, 0x2db7, MLineBreaker::EAlLineBreakClass }, //ETHIOPIC SYLLABLE ZZA
+ { 0x2db8, 0x2dbf, MLineBreaker::EAlLineBreakClass }, //ETHIOPIC SYLLABLE CCHA
+ { 0x2dc0, 0x2dc7, MLineBreaker::EAlLineBreakClass }, //ETHIOPIC SYLLABLE QYA
+ { 0x2dc8, 0x2dcf, MLineBreaker::EAlLineBreakClass }, //ETHIOPIC SYLLABLE KYA
+ { 0x2dd0, 0x2dd7, MLineBreaker::EAlLineBreakClass }, //ETHIOPIC SYLLABLE XYA
+ { 0x2dd8, 0x2ddf, MLineBreaker::EAlLineBreakClass }, //ETHIOPIC SYLLABLE GYA
+ { 0x2e00, 0x2e0e, MLineBreaker::EQuLineBreakClass }, //RIGHT ANGLE SUBSTITUTION MARKER
+ { 0x2e0e, 0x2e16, MLineBreaker::EBaLineBreakClass }, //EDITORIAL CORONIS
+ { 0x2e16, 0x2e17, MLineBreaker::EAlLineBreakClass }, //DOTTED RIGHT-POINTING ANGLE
+ { 0x2e17, 0x2e18, MLineBreaker::EBaLineBreakClass }, //DOUBLE OBLIQUE HYPHEN
+ { 0x2e1c, 0x2e1e, MLineBreaker::EQuLineBreakClass }, //LEFT LOW PARAPHRASE BRACKET
+ { 0x2e80, 0x2e9a, MLineBreaker::EIdLineBreakClass }, //cjk radical repeat
+ { 0x2e9b, 0x2ef4, MLineBreaker::EIdLineBreakClass }, //cjk radical choke
+ { 0x2f00, 0x2fd6, MLineBreaker::EIdLineBreakClass }, //kangxi radical one
+ { 0x2ff0, 0x2ffc, MLineBreaker::EIdLineBreakClass }, //ideographic description character left to right
+ { 0x3000, 0x3001, MLineBreaker::EIdLineBreakClass }, //ideographic space
+ { 0x3001, 0x3003, MLineBreaker::EClLineBreakClass }, //ideographic comma
+ { 0x3003, 0x3005, MLineBreaker::EIdLineBreakClass }, //ditto mark
+ { 0x3005, 0x3006, MLineBreaker::ENsLineBreakClass }, //ideographic iteration mark
+ { 0x3006, 0x3008, MLineBreaker::EIdLineBreakClass }, //ideographic closing mark
+ { 0x3008, 0x3009, MLineBreaker::EOpLineBreakClass }, //left angle bracket
+ { 0x3009, 0x300a, MLineBreaker::EClLineBreakClass }, //right angle bracket
+ { 0x300a, 0x300b, MLineBreaker::EOpLineBreakClass }, //left double angle bracket
+ { 0x300b, 0x300c, MLineBreaker::EClLineBreakClass }, //right double angle bracket
+ { 0x300c, 0x300d, MLineBreaker::EOpLineBreakClass }, //left corner bracket
+ { 0x300d, 0x300e, MLineBreaker::EClLineBreakClass }, //right corner bracket
+ { 0x300e, 0x300f, MLineBreaker::EOpLineBreakClass }, //left white corner bracket
+ { 0x300f, 0x3010, MLineBreaker::EClLineBreakClass }, //right white corner bracket
+ { 0x3010, 0x3011, MLineBreaker::EOpLineBreakClass }, //left black lenticular bracket
+ { 0x3011, 0x3012, MLineBreaker::EClLineBreakClass }, //right black lenticular bracket
+ { 0x3012, 0x3014, MLineBreaker::EIdLineBreakClass }, //postal mark
+ { 0x3014, 0x3015, MLineBreaker::EOpLineBreakClass }, //left tortoise shell bracket
+ { 0x3015, 0x3016, MLineBreaker::EClLineBreakClass }, //right tortoise shell bracket
+ { 0x3016, 0x3017, MLineBreaker::EOpLineBreakClass }, //left white lenticular bracket
+ { 0x3017, 0x3018, MLineBreaker::EClLineBreakClass }, //right white lenticular bracket
+ { 0x3018, 0x3019, MLineBreaker::EOpLineBreakClass }, //left white tortoise shell bracket
+ { 0x3019, 0x301a, MLineBreaker::EClLineBreakClass }, //right white tortoise shell bracket
+ { 0x301a, 0x301b, MLineBreaker::EOpLineBreakClass }, //left white square bracket
+ { 0x301b, 0x301c, MLineBreaker::EClLineBreakClass }, //right white square bracket
+ { 0x301c, 0x301d, MLineBreaker::ENsLineBreakClass }, //wave dash
+ { 0x301d, 0x301e, MLineBreaker::EOpLineBreakClass }, //reversed double prime quotation mark
+ { 0x301e, 0x3020, MLineBreaker::EClLineBreakClass }, //double prime quotation mark
+ { 0x3020, 0x302a, MLineBreaker::EIdLineBreakClass }, //postal mark face
+ { 0x302a, 0x3030, MLineBreaker::ECmLineBreakClass }, //ideographic level tone mark
+ { 0x3030, 0x303b, MLineBreaker::EIdLineBreakClass }, //wavy dash
+ { 0x303b, 0x303d, MLineBreaker::ENsLineBreakClass }, //VERTICAL IDEOGRAPHIC ITERATION MARK
+ { 0x303d, 0x3040, MLineBreaker::EIdLineBreakClass }, //PART ALTERNATION MARK
+ { 0x3041, 0x3042, MLineBreaker::ENsLineBreakClass }, //hiragana letter small a
+ { 0x3042, 0x3043, MLineBreaker::EIdLineBreakClass }, //hiragana letter a
+ { 0x3043, 0x3044, MLineBreaker::ENsLineBreakClass }, //hiragana letter small i
+ { 0x3044, 0x3045, MLineBreaker::EIdLineBreakClass }, //hiragana letter i
+ { 0x3045, 0x3046, MLineBreaker::ENsLineBreakClass }, //hiragana letter small u
+ { 0x3046, 0x3047, MLineBreaker::EIdLineBreakClass }, //hiragana letter u
+ { 0x3047, 0x3048, MLineBreaker::ENsLineBreakClass }, //hiragana letter small e
+ { 0x3048, 0x3049, MLineBreaker::EIdLineBreakClass }, //hiragana letter e
+ { 0x3049, 0x304a, MLineBreaker::ENsLineBreakClass }, //hiragana letter small o
+ { 0x304a, 0x3063, MLineBreaker::EIdLineBreakClass }, //hiragana letter o
+ { 0x3063, 0x3064, MLineBreaker::ENsLineBreakClass }, //hiragana letter small tu
+ { 0x3064, 0x3083, MLineBreaker::EIdLineBreakClass }, //hiragana letter tu
+ { 0x3083, 0x3084, MLineBreaker::ENsLineBreakClass }, //hiragana letter small ya
+ { 0x3084, 0x3085, MLineBreaker::EIdLineBreakClass }, //hiragana letter ya
+ { 0x3085, 0x3086, MLineBreaker::ENsLineBreakClass }, //hiragana letter small yu
+ { 0x3086, 0x3087, MLineBreaker::EIdLineBreakClass }, //hiragana letter yu
+ { 0x3087, 0x3088, MLineBreaker::ENsLineBreakClass }, //hiragana letter small yo
+ { 0x3088, 0x308e, MLineBreaker::EIdLineBreakClass }, //hiragana letter yo
+ { 0x308e, 0x308f, MLineBreaker::ENsLineBreakClass }, //hiragana letter small wa
+ { 0x308f, 0x3095, MLineBreaker::EIdLineBreakClass }, //hiragana letter wa
+ { 0x3095, 0x3097, MLineBreaker::ENsLineBreakClass }, //HIRAGANA LETTER SMALL KA
+ { 0x3099, 0x309b, MLineBreaker::ECmLineBreakClass }, //combining katakana-hiragana voiced sound mark
+ { 0x309b, 0x309f, MLineBreaker::ENsLineBreakClass }, //katakana-hiragana voiced sound mark
+ { 0x309f, 0x30a0, MLineBreaker::EIdLineBreakClass }, //HIRAGANA DIGRAPH YORI
+ { 0x30a0, 0x30a1, MLineBreaker::ENsLineBreakClass }, //KATAKANA-HIRAGANA DOUBLE HYPHEN
+ { 0x30a1, 0x30a2, MLineBreaker::ENsLineBreakClass }, //katakana letter small a
+ { 0x30a2, 0x30a3, MLineBreaker::EIdLineBreakClass }, //katakana letter a
+ { 0x30a3, 0x30a4, MLineBreaker::ENsLineBreakClass }, //katakana letter small i
+ { 0x30a4, 0x30a5, MLineBreaker::EIdLineBreakClass }, //katakana letter i
+ { 0x30a5, 0x30a6, MLineBreaker::ENsLineBreakClass }, //katakana letter small u
+ { 0x30a6, 0x30a7, MLineBreaker::EIdLineBreakClass }, //katakana letter u
+ { 0x30a7, 0x30a8, MLineBreaker::ENsLineBreakClass }, //katakana letter small e
+ { 0x30a8, 0x30a9, MLineBreaker::EIdLineBreakClass }, //katakana letter e
+ { 0x30a9, 0x30aa, MLineBreaker::ENsLineBreakClass }, //katakana letter small o
+ { 0x30aa, 0x30c3, MLineBreaker::EIdLineBreakClass }, //katakana letter o
+ { 0x30c3, 0x30c4, MLineBreaker::ENsLineBreakClass }, //katakana letter small tu
+ { 0x30c4, 0x30e3, MLineBreaker::EIdLineBreakClass }, //katakana letter tu
+ { 0x30e3, 0x30e4, MLineBreaker::ENsLineBreakClass }, //katakana letter small ya
+ { 0x30e4, 0x30e5, MLineBreaker::EIdLineBreakClass }, //katakana letter ya
+ { 0x30e5, 0x30e6, MLineBreaker::ENsLineBreakClass }, //katakana letter small yu
+ { 0x30e6, 0x30e7, MLineBreaker::EIdLineBreakClass }, //katakana letter yu
+ { 0x30e7, 0x30e8, MLineBreaker::ENsLineBreakClass }, //katakana letter small yo
+ { 0x30e8, 0x30ee, MLineBreaker::EIdLineBreakClass }, //katakana letter yo
+ { 0x30ee, 0x30ef, MLineBreaker::ENsLineBreakClass }, //katakana letter small wa
+ { 0x30ef, 0x30f5, MLineBreaker::EIdLineBreakClass }, //katakana letter wa
+ { 0x30f5, 0x30f7, MLineBreaker::ENsLineBreakClass }, //katakana letter small ka
+ { 0x30f7, 0x30fb, MLineBreaker::EIdLineBreakClass }, //katakana letter va
+ { 0x30fb, 0x30fc, MLineBreaker::ENsLineBreakClass }, //katakana middle dot
+ { 0x30fc, 0x30fd, MLineBreaker::EIdLineBreakClass }, //katakana-hiragana prolonged sound mark
+ { 0x30fd, 0x30fe, MLineBreaker::ENsLineBreakClass }, //katakana iteration mark
+ { 0x30fe, 0x30ff, MLineBreaker::EIdLineBreakClass }, //katakana voiced iteration mark
+ { 0x30ff, 0x3100, MLineBreaker::EIdLineBreakClass }, //KATAKANA DIGRAPH KOTO
+ { 0x3105, 0x312d, MLineBreaker::EIdLineBreakClass }, //bopomofo letter b
+ { 0x3131, 0x318f, MLineBreaker::EIdLineBreakClass }, //hangul letter kiyeok
+ { 0x3190, 0x31b8, MLineBreaker::EIdLineBreakClass }, //ideographic annotation linking mark
+ { 0x31c0, 0x31d0, MLineBreaker::EIdLineBreakClass }, //CJK STROKE T
+ { 0x31f0, 0x3200, MLineBreaker::ENsLineBreakClass }, //KATAKANA LETTER SMALL KU
+ { 0x3200, 0x321f, MLineBreaker::EIdLineBreakClass }, //parenthesized hangul kiyeok
+ { 0x3220, 0x3244, MLineBreaker::EIdLineBreakClass }, //parenthesized ideograph one
+ { 0x3250, 0x32ff, MLineBreaker::EIdLineBreakClass }, //PARTNERSHIP SIGN
+ { 0x3300, 0x4db6, MLineBreaker::EIdLineBreakClass }, //square apaato
+ { 0x4dc0, 0x4e00, MLineBreaker::EAlLineBreakClass }, //HEXAGRAM FOR THE CREATIVE HEAVEN
+ { 0x4e00, 0x9fbb, MLineBreaker::EIdLineBreakClass }, //<cjk ideograph,
+ { 0xa000, 0xa48d, MLineBreaker::EIdLineBreakClass }, //yi syllable it
+ { 0xa490, 0xa4c6, MLineBreaker::EIdLineBreakClass }, //yi radical qot
+ { 0xa4c6, 0xa4c7, MLineBreaker::EIdLineBreakClass }, //yi radical ke
+ { 0xa700, 0xa71b, MLineBreaker::EAlLineBreakClass }, //MODIFIER LETTER CHINESE TONE YIN PING
+ { 0xa720, 0xa722, MLineBreaker::EAlLineBreakClass }, //MODIFIER LETTER STRESS AND HIGH TONE
+ { 0xa800, 0xa802, MLineBreaker::EAlLineBreakClass }, //SYLOTI NAGRI LETTER A
+ { 0xa802, 0xa803, MLineBreaker::ECmLineBreakClass }, //SYLOTI NAGRI SIGN DVISVARA
+ { 0xa803, 0xa806, MLineBreaker::EAlLineBreakClass }, //SYLOTI NAGRI LETTER U
+ { 0xa806, 0xa807, MLineBreaker::ECmLineBreakClass }, //SYLOTI NAGRI SIGN HASANTA
+ { 0xa807, 0xa80b, MLineBreaker::EAlLineBreakClass }, //SYLOTI NAGRI LETTER KO
+ { 0xa80b, 0xa80c, MLineBreaker::ECmLineBreakClass }, //SYLOTI NAGRI SIGN ANUSVARA
+ { 0xa80c, 0xa823, MLineBreaker::EAlLineBreakClass }, //SYLOTI NAGRI LETTER CO
+ { 0xa823, 0xa828, MLineBreaker::ECmLineBreakClass }, //SYLOTI NAGRI VOWEL SIGN A
+ { 0xa828, 0xa82c, MLineBreaker::EAlLineBreakClass }, //SYLOTI NAGRI POETRY MARK-1
+ { 0xa840, 0xa874, MLineBreaker::EAlLineBreakClass }, //PHAGS-PA LETTER KA
+ { 0xa874, 0xa876, MLineBreaker::EBbLineBreakClass }, //PHAGS-PA SINGLE HEAD MARK
+ { 0xa876, 0xa878, MLineBreaker::EExLineBreakClass }, //PHAGS-PA MARK SHAD
+ { 0xac00, 0xd7a4, MLineBreaker::EIdLineBreakClass }, //<hangul syllable,
+ { 0xd800, 0xe000, MLineBreaker::ESgLineBreakClass }, //<non private use high surrogate,
+ { 0xe000, 0xf900, MLineBreaker::EAiLineBreakClass }, //<private use,
+ { 0xf900, 0xfa2e, MLineBreaker::EIdLineBreakClass }, //cjk compatibility ideograph-f900
+ { 0xfa30, 0xfa6b, MLineBreaker::EIdLineBreakClass }, //CJK COMPATIBILITY IDEOGRAPH-FA30
+ { 0xfa70, 0xfada, MLineBreaker::EIdLineBreakClass }, //CJK COMPATIBILITY IDEOGRAPH-FA70
+ { 0xfb00, 0xfb07, MLineBreaker::EAlLineBreakClass }, //latin small ligature ff
+ { 0xfb13, 0xfb18, MLineBreaker::EAlLineBreakClass }, //armenian small ligature men now
+ { 0xfb1d, 0xfb1e, MLineBreaker::EAlLineBreakClass }, //hebrew letter yod with hiriq
+ { 0xfb1e, 0xfb1f, MLineBreaker::ECmLineBreakClass }, //hebrew point judeo-spanish varika
+ { 0xfb1f, 0xfb37, MLineBreaker::EAlLineBreakClass }, //hebrew ligature yiddish yod yod patah
+ { 0xfb38, 0xfb3d, MLineBreaker::EAlLineBreakClass }, //hebrew letter tet with dagesh
+ { 0xfb3e, 0xfb3f, MLineBreaker::EAlLineBreakClass }, //hebrew letter mem with dagesh
+ { 0xfb40, 0xfb42, MLineBreaker::EAlLineBreakClass }, //hebrew letter nun with dagesh
+ { 0xfb43, 0xfb45, MLineBreaker::EAlLineBreakClass }, //hebrew letter final pe with dagesh
+ { 0xfb46, 0xfbb2, MLineBreaker::EAlLineBreakClass }, //hebrew letter tsadi with dagesh
+ { 0xfbd3, 0xfd3e, MLineBreaker::EAlLineBreakClass }, //arabic letter ng isolated form
+ { 0xfd3e, 0xfd3f, MLineBreaker::EOpLineBreakClass }, //ornate left parenthesis
+ { 0xfd3f, 0xfd40, MLineBreaker::EClLineBreakClass }, //ornate right parenthesis
+ { 0xfd50, 0xfd90, MLineBreaker::EAlLineBreakClass }, //arabic ligature teh with jeem with meem initial form
+ { 0xfd92, 0xfdc8, MLineBreaker::EAlLineBreakClass }, //arabic ligature meem with jeem with khah initial form
+ { 0xfdf0, 0xfdfc, MLineBreaker::EAlLineBreakClass }, //arabic ligature salla used as koranic stop sign isolated form
+ { 0xfdfc, 0xfdfd, MLineBreaker::EPoLineBreakClass }, //RIAL SIGN
+ { 0xfdfd, 0xfdfe, MLineBreaker::EAlLineBreakClass }, //ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM
+ { 0xfe00, 0xfe10, MLineBreaker::ECmLineBreakClass }, //VARIATION SELECTOR-1
+ { 0xfe10, 0xfe11, MLineBreaker::EIsLineBreakClass }, //PRESENTATION FORM FOR VERTICAL COMMA
+ { 0xfe11, 0xfe13, MLineBreaker::EClLineBreakClass }, //PRESENTATION FORM FOR VERTICAL IDEOGRAPHIC COMMA
+ { 0xfe13, 0xfe15, MLineBreaker::EIsLineBreakClass }, //PRESENTATION FORM FOR VERTICAL COLON
+ { 0xfe15, 0xfe17, MLineBreaker::EExLineBreakClass }, //PRESENTATION FORM FOR VERTICAL EXCLAMATION MARK
+ { 0xfe17, 0xfe18, MLineBreaker::EOpLineBreakClass }, //PRESENTATION FORM FOR VERTICAL LEFT WHITE LENTICULAR BRACKET
+ { 0xfe18, 0xfe19, MLineBreaker::EClLineBreakClass }, //PRESENTATION FORM FOR VERTICAL RIGHT WHITE LENTICULAR BRAKCET
+ { 0xfe19, 0xfe1a, MLineBreaker::EInLineBreakClass }, //PRESENTATION FORM FOR VERTICAL HORIZONTAL ELLIPSIS
+ { 0xfe20, 0xfe24, MLineBreaker::ECmLineBreakClass }, //combining ligature left half
+ { 0xfe30, 0xfe35, MLineBreaker::EIdLineBreakClass }, //presentation form for vertical two dot leader
+ { 0xfe35, 0xfe36, MLineBreaker::EOpLineBreakClass }, //presentation form for vertical left parenthesis
+ { 0xfe36, 0xfe37, MLineBreaker::EClLineBreakClass }, //presentation form for vertical right parenthesis
+ { 0xfe37, 0xfe38, MLineBreaker::EOpLineBreakClass }, //presentation form for vertical left curly bracket
+ { 0xfe38, 0xfe39, MLineBreaker::EClLineBreakClass }, //presentation form for vertical right curly bracket
+ { 0xfe39, 0xfe3a, MLineBreaker::EOpLineBreakClass }, //presentation form for vertical left tortoise shell bracket
+ { 0xfe3a, 0xfe3b, MLineBreaker::EClLineBreakClass }, //presentation form for vertical right tortoise shell bracket
+ { 0xfe3b, 0xfe3c, MLineBreaker::EOpLineBreakClass }, //presentation form for vertical left black lenticular bracket
+ { 0xfe3c, 0xfe3d, MLineBreaker::EClLineBreakClass }, //presentation form for vertical right black lenticular bracket
+ { 0xfe3d, 0xfe3e, MLineBreaker::EOpLineBreakClass }, //presentation form for vertical left double angle bracket
+ { 0xfe3e, 0xfe3f, MLineBreaker::EClLineBreakClass }, //presentation form for vertical right double angle bracket
+ { 0xfe3f, 0xfe40, MLineBreaker::EOpLineBreakClass }, //presentation form for vertical left angle bracket
+ { 0xfe40, 0xfe41, MLineBreaker::EClLineBreakClass }, //presentation form for vertical right angle bracket
+ { 0xfe41, 0xfe42, MLineBreaker::EOpLineBreakClass }, //presentation form for vertical left corner bracket
+ { 0xfe42, 0xfe43, MLineBreaker::EClLineBreakClass }, //presentation form for vertical right corner bracket
+ { 0xfe43, 0xfe44, MLineBreaker::EOpLineBreakClass }, //presentation form for vertical left white corner bracket
+ { 0xfe44, 0xfe45, MLineBreaker::EClLineBreakClass }, //presentation form for vertical right white corner bracket
+ { 0xfe45, 0xfe47, MLineBreaker::EIdLineBreakClass }, //SESAME DOT
+ { 0xfe47, 0xfe48, MLineBreaker::EOpLineBreakClass }, //PRESENTATION FORM FOR VERTICAL LEFT SQUARE BRACKET
+ { 0xfe48, 0xfe49, MLineBreaker::EClLineBreakClass }, //PRESENTATION FORM FOR VERTICAL RIGHT SQUARE BRACKET
+ { 0xfe49, 0xfe50, MLineBreaker::EIdLineBreakClass }, //dashed overline
+ { 0xfe50, 0xfe51, MLineBreaker::EClLineBreakClass }, //small comma
+ { 0xfe51, 0xfe52, MLineBreaker::EIdLineBreakClass }, //small ideographic comma
+ { 0xfe52, 0xfe53, MLineBreaker::EClLineBreakClass }, //small full stop
+ { 0xfe54, 0xfe56, MLineBreaker::ENsLineBreakClass }, //small semicolon
+ { 0xfe56, 0xfe58, MLineBreaker::EExLineBreakClass }, //small question mark
+ { 0xfe58, 0xfe59, MLineBreaker::EIdLineBreakClass }, //small em dash
+ { 0xfe59, 0xfe5a, MLineBreaker::EOpLineBreakClass }, //small left parenthesis
+ { 0xfe5a, 0xfe5b, MLineBreaker::EClLineBreakClass }, //small right parenthesis
+ { 0xfe5b, 0xfe5c, MLineBreaker::EOpLineBreakClass }, //small left curly bracket
+ { 0xfe5c, 0xfe5d, MLineBreaker::EClLineBreakClass }, //small right curly bracket
+ { 0xfe5d, 0xfe5e, MLineBreaker::EOpLineBreakClass }, //small left tortoise shell bracket
+ { 0xfe5e, 0xfe5f, MLineBreaker::EClLineBreakClass }, //small right tortoise shell bracket
+ { 0xfe5f, 0xfe67, MLineBreaker::EIdLineBreakClass }, //small number sign
+ { 0xfe68, 0xfe69, MLineBreaker::EIdLineBreakClass }, //small reverse solidus
+ { 0xfe69, 0xfe6a, MLineBreaker::EPrLineBreakClass }, //small dollar sign
+ { 0xfe6a, 0xfe6b, MLineBreaker::EPoLineBreakClass }, //small percent sign
+ { 0xfe6b, 0xfe6c, MLineBreaker::EAlLineBreakClass }, //small commercial at
+ { 0xfe70, 0xfe74, MLineBreaker::EAlLineBreakClass }, //arabic fathatan isolated form
+ { 0xfe74, 0xfe75, MLineBreaker::EAlLineBreakClass }, //arabic kasratan isolated form
+ { 0xfe76, 0xfefd, MLineBreaker::EAlLineBreakClass }, //arabic fatha isolated form
+ { 0xfeff, 0xff00, MLineBreaker::EGlLineBreakClass }, //zero width no-break space
+ { 0xff01, 0xff02, MLineBreaker::EExLineBreakClass }, //fullwidth exclamation mark
+ { 0xff02, 0xff04, MLineBreaker::EIdLineBreakClass }, //fullwidth quotation mark
+ { 0xff04, 0xff05, MLineBreaker::EPrLineBreakClass }, //fullwidth dollar sign
+ { 0xff05, 0xff06, MLineBreaker::EPoLineBreakClass }, //fullwidth percent sign
+ { 0xff06, 0xff08, MLineBreaker::EIdLineBreakClass }, //fullwidth ampersand
+ { 0xff08, 0xff09, MLineBreaker::EOpLineBreakClass }, //fullwidth left parenthesis
+ { 0xff09, 0xff0a, MLineBreaker::EClLineBreakClass }, //fullwidth right parenthesis
+ { 0xff0a, 0xff0c, MLineBreaker::EIdLineBreakClass }, //fullwidth asterisk
+ { 0xff0c, 0xff0d, MLineBreaker::EClLineBreakClass }, //fullwidth comma
+ { 0xff0d, 0xff0e, MLineBreaker::EIdLineBreakClass }, //fullwidth hyphen-minus
+ { 0xff0e, 0xff0f, MLineBreaker::EClLineBreakClass }, //fullwidth full stop
+ { 0xff0f, 0xff1a, MLineBreaker::EIdLineBreakClass }, //fullwidth solidus
+ { 0xff1a, 0xff1c, MLineBreaker::ENsLineBreakClass }, //fullwidth colon
+ { 0xff1c, 0xff1f, MLineBreaker::EIdLineBreakClass }, //fullwidth less-than sign
+ { 0xff1f, 0xff20, MLineBreaker::EExLineBreakClass }, //fullwidth question mark
+ { 0xff20, 0xff3b, MLineBreaker::EIdLineBreakClass }, //fullwidth commercial at
+ { 0xff3b, 0xff3c, MLineBreaker::EOpLineBreakClass }, //fullwidth left square bracket
+ { 0xff3c, 0xff3d, MLineBreaker::EIdLineBreakClass }, //fullwidth reverse solidus
+ { 0xff3d, 0xff3e, MLineBreaker::EClLineBreakClass }, //fullwidth right square bracket
+ { 0xff3e, 0xff5b, MLineBreaker::EIdLineBreakClass }, //fullwidth circumflex accent
+ { 0xff5b, 0xff5c, MLineBreaker::EOpLineBreakClass }, //fullwidth left curly bracket
+ { 0xff5c, 0xff5d, MLineBreaker::EIdLineBreakClass }, //fullwidth vertical line
+ { 0xff5d, 0xff5e, MLineBreaker::EClLineBreakClass }, //fullwidth right curly bracket
+ { 0xff5e, 0xff5f, MLineBreaker::EIdLineBreakClass }, //fullwidth tilde
+ { 0xff5f, 0xff60, MLineBreaker::EOpLineBreakClass }, //FULLWIDTH LEFT WHITE PARENTHESIS
+ { 0xff60, 0xff61, MLineBreaker::EClLineBreakClass }, //FULLWIDTH RIGHT WHITE PARENTHESIS
+ { 0xff61, 0xff62, MLineBreaker::EClLineBreakClass }, //halfwidth ideographic full stop
+ { 0xff62, 0xff63, MLineBreaker::EOpLineBreakClass }, //halfwidth left corner bracket
+ { 0xff63, 0xff65, MLineBreaker::EClLineBreakClass }, //halfwidth right corner bracket
+ { 0xff65, 0xff66, MLineBreaker::ENsLineBreakClass }, //halfwidth katakana middle dot
+ { 0xff66, 0xff67, MLineBreaker::EAlLineBreakClass }, //halfwidth katakana letter wo
+ { 0xff67, 0xff71, MLineBreaker::ENsLineBreakClass }, //halfwidth katakana letter small a
+ { 0xff71, 0xff9e, MLineBreaker::EAlLineBreakClass }, //halfwidth katakana letter a
+ { 0xff9e, 0xffa0, MLineBreaker::ENsLineBreakClass }, //halfwidth katakana voiced sound mark
+ { 0xffa0, 0xffbf, MLineBreaker::EAlLineBreakClass }, //halfwidth hangul filler
+ { 0xffc2, 0xffc8, MLineBreaker::EAlLineBreakClass }, //halfwidth hangul letter a
+ { 0xffca, 0xffd0, MLineBreaker::EAlLineBreakClass }, //halfwidth hangul letter yeo
+ { 0xffd2, 0xffd8, MLineBreaker::EAlLineBreakClass }, //halfwidth hangul letter yo
+ { 0xffda, 0xffdd, MLineBreaker::EAlLineBreakClass }, //halfwidth hangul letter eu
+ { 0xffe0, 0xffe1, MLineBreaker::EPoLineBreakClass }, //fullwidth cent sign
+ { 0xffe1, 0xffe2, MLineBreaker::EPrLineBreakClass }, //fullwidth pound sign
+ { 0xffe2, 0xffe5, MLineBreaker::EIdLineBreakClass }, //fullwidth not sign
+ { 0xffe5, 0xffe7, MLineBreaker::EPrLineBreakClass }, //fullwidth yen sign
+ { 0xffe8, 0xffef, MLineBreaker::EAlLineBreakClass }, //halfwidth forms light vertical
+ { 0xfff9, 0xfffc, MLineBreaker::ECmLineBreakClass }, //interlinear annotation anchor
+ { 0xfffc, 0xfffd, MLineBreaker::ECbLineBreakClass }, //object replacement character
+ { 0xfffd, 0xfffe, MLineBreaker::EAiLineBreakClass }, //replacement character
+ { 0x10000, 0x1000c, MLineBreaker::EAlLineBreakClass }, //LINEAR B SYLLABLE B008 A
+ { 0x1000d, 0x10027, MLineBreaker::EAlLineBreakClass }, //LINEAR B SYLLABLE B036 JO
+ { 0x10028, 0x1003b, MLineBreaker::EAlLineBreakClass }, //LINEAR B SYLLABLE B060 RA
+ { 0x1003c, 0x1003e, MLineBreaker::EAlLineBreakClass }, //LINEAR B SYLLABLE B017 ZA
+ { 0x1003f, 0x1004e, MLineBreaker::EAlLineBreakClass }, //LINEAR B SYLLABLE B020 ZO
+ { 0x10050, 0x1005e, MLineBreaker::EAlLineBreakClass }, //LINEAR B SYMBOL B018
+ { 0x10080, 0x100fb, MLineBreaker::EAlLineBreakClass }, //LINEAR B IDEOGRAM B100 MAN
+ { 0x10100, 0x10103, MLineBreaker::EBaLineBreakClass }, //AEGEAN WORD SEPARATOR LINE
+ { 0x10107, 0x10134, MLineBreaker::EAlLineBreakClass }, //AEGEAN NUMBER ONE
+ { 0x10137, 0x1018b, MLineBreaker::EAlLineBreakClass }, //AEGEAN WEIGHT BASE UNIT
+ { 0x10300, 0x1031f, MLineBreaker::EAlLineBreakClass }, //OLD ITALIC LETTER A
+ { 0x10320, 0x10324, MLineBreaker::EAlLineBreakClass }, //OLD ITALIC NUMERAL ONE
+ { 0x10330, 0x1034b, MLineBreaker::EAlLineBreakClass }, //GOTHIC LETTER AHSA
+ { 0x10380, 0x1039e, MLineBreaker::EAlLineBreakClass }, //UGARITIC LETTER ALPA
+ { 0x1039f, 0x103a0, MLineBreaker::EBaLineBreakClass }, //UGARITIC WORD DIVIDER
+ { 0x103a0, 0x103c4, MLineBreaker::EAlLineBreakClass }, //OLD PERSIAN SIGN A
+ { 0x103c8, 0x103d0, MLineBreaker::EAlLineBreakClass }, //OLD PERSIAN SIGN AURAMAZDAA
+ { 0x103d0, 0x103d1, MLineBreaker::EBaLineBreakClass }, //OLD PERSIAN WORD DIVIDER
+ { 0x103d1, 0x103d6, MLineBreaker::EAlLineBreakClass }, //OLD PERSIAN NUMBER ONE
+ { 0x10400, 0x1049e, MLineBreaker::EAlLineBreakClass }, //DESERET CAPITAL LETTER LONG I
+ { 0x104a0, 0x104aa, MLineBreaker::ENuLineBreakClass }, //OSMANYA DIGIT ZERO
+ { 0x10800, 0x10806, MLineBreaker::EAlLineBreakClass }, //CYPRIOT SYLLABLE A
+ { 0x10808, 0x10809, MLineBreaker::EAlLineBreakClass }, //CYPRIOT SYLLABLE JO
+ { 0x1080a, 0x10836, MLineBreaker::EAlLineBreakClass }, //CYPRIOT SYLLABLE KA
+ { 0x10837, 0x10839, MLineBreaker::EAlLineBreakClass }, //CYPRIOT SYLLABLE XA
+ { 0x1083c, 0x1083d, MLineBreaker::EAlLineBreakClass }, //CYPRIOT SYLLABLE ZA
+ { 0x1083f, 0x10840, MLineBreaker::EAlLineBreakClass }, //CYPRIOT SYLLABLE ZO
+ { 0x10900, 0x1091a, MLineBreaker::EAlLineBreakClass }, //PHOENICIAN LETTER ALF
+ { 0x1091f, 0x10920, MLineBreaker::EBaLineBreakClass }, //PHOENICIAN WORD SEPARATOR
+ { 0x10a00, 0x10a01, MLineBreaker::EAlLineBreakClass }, //KHAROSHTHI LETTER A
+ { 0x10a01, 0x10a04, MLineBreaker::ECmLineBreakClass }, //KHAROSHTHI VOWEL SIGN I
+ { 0x10a05, 0x10a07, MLineBreaker::ECmLineBreakClass }, //KHAROSHTHI VOWEL SIGN E
+ { 0x10a0c, 0x10a10, MLineBreaker::ECmLineBreakClass }, //KHAROSHTHI VOWEL LENGTH MARK
+ { 0x10a10, 0x10a14, MLineBreaker::EAlLineBreakClass }, //KHAROSHTHI LETTER KA
+ { 0x10a15, 0x10a18, MLineBreaker::EAlLineBreakClass }, //KHAROSHTHI LETTER CA
+ { 0x10a19, 0x10a34, MLineBreaker::EAlLineBreakClass }, //KHAROSHTHI LETTER NYA
+ { 0x10a38, 0x10a3b, MLineBreaker::ECmLineBreakClass }, //KHAROSHTHI SIGN BAR ABOVE
+ { 0x10a3f, 0x10a40, MLineBreaker::ECmLineBreakClass }, //KHAROSHTHI VIRAMA
+ { 0x10a40, 0x10a48, MLineBreaker::EAlLineBreakClass }, //KHAROSHTHI DIGIT ONE
+ { 0x10a50, 0x10a58, MLineBreaker::EBaLineBreakClass }, //KHAROSHTHI PUNCTUATION DOT
+ { 0x10a58, 0x10a59, MLineBreaker::EAlLineBreakClass }, //KHAROSHTHI PUNCTUATION LINES
+ { 0x12000, 0x1236f, MLineBreaker::EAlLineBreakClass }, //CUNEIFORM SIGN A
+ { 0x12400, 0x12463, MLineBreaker::EAlLineBreakClass }, //CUNEIFORM NUMERIC SIGN TWO ASH
+ { 0x12470, 0x12474, MLineBreaker::EBaLineBreakClass }, //CUNEIFORM PUNCTUATION SIGN OLD ASSYRIAN WORD DIVIDER
+ { 0x1d000, 0x1d0f6, MLineBreaker::EAlLineBreakClass }, //BYZANTINE MUSICAL SYMBOL PSILI
+ { 0x1d100, 0x1d127, MLineBreaker::EAlLineBreakClass }, //MUSICAL SYMBOL SINGLE BARLINE
+ { 0x1d12a, 0x1d165, MLineBreaker::EAlLineBreakClass }, //MUSICAL SYMBOL DOUBLE SHARP
+ { 0x1d165, 0x1d16a, MLineBreaker::ECmLineBreakClass }, //MUSICAL SYMBOL COMBINING STEM
+ { 0x1d16a, 0x1d16d, MLineBreaker::EAlLineBreakClass }, //MUSICAL SYMBOL FINGERED TREMOLO-1
+ { 0x1d16d, 0x1d183, MLineBreaker::ECmLineBreakClass }, //MUSICAL SYMBOL COMBINING AUGMENTATION DOT
+ { 0x1d183, 0x1d185, MLineBreaker::EAlLineBreakClass }, //MUSICAL SYMBOL ARPEGGIATO UP
+ { 0x1d185, 0x1d18c, MLineBreaker::ECmLineBreakClass }, //MUSICAL SYMBOL COMBINING DOIT
+ { 0x1d18c, 0x1d1aa, MLineBreaker::EAlLineBreakClass }, //MUSICAL SYMBOL RINFORZANDO
+ { 0x1d1aa, 0x1d1ae, MLineBreaker::ECmLineBreakClass }, //MUSICAL SYMBOL COMBINING DOWN BOW
+ { 0x1d1ae, 0x1d1de, MLineBreaker::EAlLineBreakClass }, //MUSICAL SYMBOL PEDAL MARK
+ { 0x1d200, 0x1d242, MLineBreaker::EAlLineBreakClass }, //GREEK VOCAL NOTATION SYMBOL-1
+ { 0x1d242, 0x1d245, MLineBreaker::ECmLineBreakClass }, //COMBINING GREEK MUSICAL TRISEME
+ { 0x1d245, 0x1d246, MLineBreaker::EAlLineBreakClass }, //GREEK MUSICAL LEIMMA
+ { 0x1d300, 0x1d357, MLineBreaker::EAlLineBreakClass }, //MONOGRAM FOR EARTH
+ { 0x1d360, 0x1d372, MLineBreaker::EAlLineBreakClass }, //COUNTING ROD UNIT DIGIT ONE
+ { 0x1d400, 0x1d455, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL BOLD CAPITAL A
+ { 0x1d456, 0x1d49d, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL ITALIC SMALL I
+ { 0x1d49e, 0x1d4a0, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL SCRIPT CAPITAL C
+ { 0x1d4a2, 0x1d4a3, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL SCRIPT CAPITAL G
+ { 0x1d4a5, 0x1d4a7, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL SCRIPT CAPITAL J
+ { 0x1d4a9, 0x1d4ad, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL SCRIPT CAPITAL N
+ { 0x1d4ae, 0x1d4ba, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL SCRIPT CAPITAL S
+ { 0x1d4bb, 0x1d4bc, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL SCRIPT SMALL F
+ { 0x1d4bd, 0x1d4c4, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL SCRIPT SMALL H
+ { 0x1d4c5, 0x1d506, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL SCRIPT SMALL P
+ { 0x1d507, 0x1d50b, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL FRAKTUR CAPITAL D
+ { 0x1d50d, 0x1d515, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL FRAKTUR CAPITAL J
+ { 0x1d516, 0x1d51d, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL FRAKTUR CAPITAL S
+ { 0x1d51e, 0x1d53a, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL FRAKTUR SMALL A
+ { 0x1d53b, 0x1d53f, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL DOUBLE-STRUCK CAPITAL D
+ { 0x1d540, 0x1d545, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL DOUBLE-STRUCK CAPITAL I
+ { 0x1d546, 0x1d547, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL DOUBLE-STRUCK CAPITAL O
+ { 0x1d54a, 0x1d551, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL DOUBLE-STRUCK CAPITAL S
+ { 0x1d552, 0x1d6a6, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL DOUBLE-STRUCK SMALL A
+ { 0x1d6a8, 0x1d7cc, MLineBreaker::EAlLineBreakClass }, //MATHEMATICAL BOLD CAPITAL ALPHA
+ { 0x1d7ce, 0x1d800, MLineBreaker::ENuLineBreakClass }, //MATHEMATICAL BOLD DIGIT ZERO
+ { 0x20000, 0x2a6d6, MLineBreaker::EIdLineBreakClass }, //<CJK Ideograph Extension B, First>..<CJK Ideograph Extension B, Last>
+ { 0x2f800, 0x2fa1e, MLineBreaker::EIdLineBreakClass }, //CJK COMPATIBILITY IDEOGRAPH-2F800
+ { 0xe0001, 0xe0002, MLineBreaker::ECmLineBreakClass }, //LANGUAGE TAG
+ { 0xe0020, 0xe0080, MLineBreaker::ECmLineBreakClass }, //TAG SPACE
+ { 0xe0100, 0xe01f0, MLineBreaker::ECmLineBreakClass }, //VARIATION SELECTOR-17
+ { 0xf0000, 0xffffd, MLineBreaker::EXxLineBreakClass }, //<Plane 15 Private Use, First>..<Plane 15 Private Use, Last>
+ { 0x100000, 0x10fffd, MLineBreaker::EXxLineBreakClass }, //<Plane 16 Private Use, First>..<Plane 16 Private Use, Last>
+ };
+
+static const TInt TheLineBreakRanges = sizeof(TheLineBreakRangeTable) / sizeof(TheLineBreakRangeTable[0]);
+
+void TestLineBreakTables(void)
+ {
+#ifdef _DEBUG
+ TUint prev_end = 0;
+ for (int i = 0; i < TheLineBreakRanges; i++)
+ {
+ const TLineBreakRange& r = TheLineBreakRangeTable[i];
+ if (r.iStart >= r.iEnd || r.iClass >= MLineBreaker::ELineBreakClasses || r.iStart < prev_end)
+ Panic(ELineBreakPanic_BadTable);
+ prev_end = r.iEnd;
+ }
+#endif
+ }
+
+TUint TLineBreakClassCache::LineBreakClass(TUint aChar)
+ {
+ if (aChar >= iStart && aChar < iEnd)
+ return iClass;
+ TUint new_start, new_end;
+ TUint new_class = iBreaker.LineBreakClass(aChar,new_start,new_end);
+ if (new_start < new_end - 1)
+ {
+ iStart = new_start;
+ iEnd = new_end;
+ iClass = new_class;
+ }
+ return new_class;
+ }
+
+EXPORT_C TBool MLineBreaker::LineBreakPossible(
+ TUint aPrevClass, TUint aNextClass, TBool aHaveSpaces) const
+/** Returns whether line breaks are legal between a character of line breaking
+class aPrevClass and aNextClass, with intervening spaces or not as determined
+by aHaveSpaces.
+
+@param aPrevClass The class before the potential line break.
+@param aNextClass The class after the potential line break.
+@param aHaveSpaces Whether spaces separate the characters.
+@return ETrue if and only if a line break is legal in the situation described. */
+ {
+ if (aPrevClass >= ELineBreakClasses || aNextClass >= ELineBreakClasses)
+ return FALSE;
+ const TLineBreakRule& rule = TheLineBreakRuleTable[aPrevClass];
+ TUint flag = 1 << aNextClass;
+ if (rule.iForbid & flag)
+ return FALSE;
+ return aHaveSpaces || (rule.iAllow & flag);
+ }
+
+EXPORT_C TUint MLineBreaker::LineBreakClass(TUint aCode,TUint& aRangeStart,TUint& aRangeEnd) const
+/** Converts Unicode character into line breaking class.
+
+@param aCode Input Unicode value.
+@param aRangeStart Returns the start of the contiguous range of characters
+including aCode that have the returned line breaking class.
+@param aRangeEnd Returns the end of the contiguous range of characters including
+aCode that have the returned line breaking class.
+@return The line breaking class for aCode. */
+ {
+ aRangeStart = aCode;
+ aRangeEnd = aCode + 1;
+
+ // First check for a space; this needs to be fast.
+ if (aCode == 0x0020)
+ return ESpLineBreakClass;
+
+ // Now search the table.
+ const TLineBreakRange* base = TheLineBreakRangeTable;
+ const TLineBreakRange* end = base + TheLineBreakRanges;
+ while (base < end)
+ {
+ int n = end - base;
+ const TLineBreakRange* r = &base[n / 2];
+ if (r->iStart > aCode)
+ end = r;
+ else if (r->iEnd <= aCode)
+ base = r + 1;
+ else
+ {
+ aRangeStart = r->iStart;
+ aRangeEnd = r->iEnd;
+ return r->iClass;
+ }
+ }
+
+ // If the character was not in the table determine the line break class using the Unicode character category.
+ TChar::TCategory cat = TChar(aCode).GetCategory();
+ switch (cat)
+ {
+ case TChar::ELuCategory:
+ case TChar::ELlCategory:
+ case TChar::ELtCategory:
+ case TChar::ELoCategory:
+ case TChar::ESmCategory:
+ case TChar::ESoCategory:
+ return EAlLineBreakClass;
+
+ case TChar::ESkCategory:
+ if (TChar(aCode).GetCjkWidth() == TChar::EWide)
+ return ENsLineBreakClass;
+ else
+ return EAlLineBreakClass;
+
+ case TChar::ELmCategory:
+ {
+ TChar::TCjkWidth cjk_width = TChar(aCode).GetCjkWidth();
+ if (cjk_width == TChar::EWide || cjk_width == TChar::EHalfWidth)
+ return ENsLineBreakClass;
+ }
+ break;
+
+ case TChar::EMnCategory:
+ case TChar::EMcCategory:
+ case TChar::EMeCategory:
+ case TChar::ECcCategory:
+ case TChar::ECfCategory:
+ return ECmLineBreakClass;
+
+ case TChar::ENdCategory:
+ return ENuLineBreakClass;
+
+ case TChar::EPsCategory:
+ return EOpLineBreakClass;
+
+ case TChar::EPeCategory:
+ return EClLineBreakClass;
+
+ case TChar::EScCategory:
+ return EPrLineBreakClass;
+
+ case TChar::EPfCategory:
+ case TChar::EPiCategory:
+ return EQuLineBreakClass;
+
+ case TChar::ECsCategory:
+ return ESgLineBreakClass;
+
+ default:
+ break;
+ }
+
+ // If it has still not been found it may be an ideographic character not covered above.
+ if (aCode >= 0x3000 && aCode <= 0x3FFF)
+ return EIdLineBreakClass;
+
+ // Or it may be a surrogate; assume plane 1 is alphabetic, plane 2 is ideographic.
+ if (aCode >= 0x10000 && aCode <= 0x1FFFF)
+ return EAlLineBreakClass;
+ if (aCode >= 0x20000 && aCode <= 0x2FFFF)
+ return EIdLineBreakClass;
+
+ // Return the catch-all class.
+ return EXxLineBreakClass;
+ }
+
+
+EXPORT_C TBool MLineBreaker::IsHangingCharacter(TUint) const
+/** Returns ETrue if the character value may be positioned outside the margins.
+
+@param aChar Chatacter to test
+@return ETrue if the character value may be positioned outside the margins. */
+ {
+ return EFalse;
+ }
+
+TInt MakeSurrogate(TInt aHigh, TInt aLow)
+ {
+ return (aHigh << 10) + (aLow & 0x3FF)
+ + (0x10000 - 0xD800*0x400);
+ }
+
+inline TBool IsSurrogate(TInt aChar)
+ {
+ return (aChar & 0xF800) == 0xD800;
+ }
+
+inline TBool IsHighSurrogate(TInt aChar)
+ {
+ return (aChar & 0xFC00) == 0xD800;
+ }
+
+inline TBool IsLowSurrogate(TInt aChar)
+ {
+ return (aChar & 0xFC00) == 0xDC00;
+ }
+
+/**
+Move past the current character and return the next.
+@param aPtr
+ Pointer to the current character. On return, contains a pointer to the next
+ character.
+@param aLimit
+ Limit of the iteration. For positive aOffset (moving forwards) this should
+ be one less than the end of the text. For negative aOffset (moving
+ backwards) this should be the start of the text.
+@param aOffset
+ 1 for moving forward, -1 for moving backward.
+@return
+ Unicode character value or -1 on error.
+@internalComponent
+*/
+TInt MoveTextPtr(const TText*& aPtr, const TText* aLimit, TInt aOffset)
+ {
+ // if (aPtr - aLimit) has the same sign as aOffset then we are
+ // already too far.
+ if (0 <= ((aPtr - aLimit) ^ aOffset)
+ && aLimit)
+ return -1;
+ TInt c = 0;
+ for (;;)
+ {
+ if (aPtr == aLimit)
+ return -1;
+ aPtr += aOffset;
+ TInt lastc = c;
+ c = *aPtr;
+ if (!IsSurrogate(c))
+ return c;
+ if (aOffset < 0)
+ {
+ if (IsHighSurrogate(c) && IsLowSurrogate(lastc))
+ return MakeSurrogate(c, lastc);
+ }
+ else
+ {
+ if (IsHighSurrogate(lastc) && IsLowSurrogate(c))
+ {
+ // found a surrogate pair
+ // Set the pointer to the first of the pair
+ --aPtr;
+ return MakeSurrogate(lastc, c);
+ }
+ }
+ }
+ }
+
+/** Find the line break class of the latest character within [aFirst, aP+1]
+to have non-CM line break class.
+@pre aP points to a character of CM class.
+*/
+inline TUint GetGlyphClusterLineBreakClass(const TText* aP,
+ const TText* aFirst, TLineBreakClassCache& aBreaker)
+ {
+ TInt ch = MoveTextPtr(aP, aFirst, -1);
+ while (0 <= ch)
+ {
+ TUint cl = aBreaker.LineBreakClass(ch);
+ if (cl != MLineBreaker::ECmLineBreakClass)
+ return cl;
+ ch = MoveTextPtr(aP, aFirst, -1);
+ }
+ return MLineBreaker::ECmLineBreakClass;
+ }
+
+void TLineBreakClassIterator::Set(const TText* aFirst, const TText* aText, TLineBreakClassCache& aBreaker)
+ {
+ iFirst = aFirst;
+ iCurrent = aText;
+ TInt c = *aText;
+ if (IsHighSurrogate(c))
+ {
+ if (IsLowSurrogate(aText[1]))
+ c = MakeSurrogate(c, aText[1]);
+ }
+ iClass = aBreaker.LineBreakClass(c);
+ if (iClass == MLineBreaker::ECmLineBreakClass)
+ {
+ TUint baseLbCls = GetGlyphClusterLineBreakClass(iCurrent, iFirst, aBreaker);
+ if (baseLbCls == MLineBreaker::ESaLineBreakClass)
+ iClass = MLineBreaker::ESaLineBreakClass;
+ }
+ }
+
+void TLineBreakClassIterator::SetNull()
+ {
+ iFirst = iCurrent = 0;
+ }
+
+TBool TLineBreakClassIterator::Move(const TText* aLimit,
+ const TText* aLimitAfterSpaces, TInt aOffset,
+ TBool& aHasSpaces, TLineBreakClassCache& aBreaker)
+ {
+ TInt c = MoveTextPtr(iCurrent, aLimit, aOffset);
+ if (c < 0)
+ return EFalse;
+ TUint lbClass = aBreaker.LineBreakClass(c);
+ if (lbClass == MLineBreaker::ESpLineBreakClass)
+ {
+ aHasSpaces = ETrue;
+ while (lbClass == MLineBreaker::ESpLineBreakClass)
+ {
+ c = MoveTextPtr(iCurrent, aLimitAfterSpaces, aOffset);
+ // We have hit the limit, but there might be more text to search
+ // after the spaces.
+ if (c < 0)
+ {
+ iClass = MLineBreaker::ESpLineBreakClass;
+ return ETrue;
+ }
+ lbClass = aBreaker.LineBreakClass(c);
+ }
+ iClass = lbClass;
+ return ETrue;
+ }
+
+ // Cm class characters taken on their base character's
+ // line break property in the combining character sequence
+ // See D14 in Conformance chapter of Unicode 3.0 book.
+ // We do this just for Complex content to maintain backwards
+ // compatibility otherwise original test cases fail.
+ if (lbClass == MLineBreaker::ECmLineBreakClass)
+ {
+ TUint baseLbCls = GetGlyphClusterLineBreakClass(iCurrent, iFirst, aBreaker);
+ if (baseLbCls == MLineBreaker::ESaLineBreakClass)
+ lbClass = MLineBreaker::ESaLineBreakClass;
+ }
+
+ aHasSpaces = EFalse;
+ if (lbClass == MLineBreaker::ESaLineBreakClass
+ && iClass == MLineBreaker::ESaLineBreakClass)
+ {
+ // We have at least two SA characters, so we need to find the
+ // total extent of the SA block. GetLineBreakInContext will be asked
+ // to find the break.
+ const TText* p = iCurrent;
+ while (0 <= c && lbClass == MLineBreaker::ESaLineBreakClass)
+ {
+ iCurrent = p;
+ c = MoveTextPtr(p, aOffset < 0? iFirst : aLimitAfterSpaces, aOffset);
+ lbClass = aBreaker.LineBreakClass(c);
+
+ // Cm class characters taken on their base character's
+ // line break property. See above.
+ if (lbClass == MLineBreaker::ECmLineBreakClass)
+ {
+ TUint baseLbCls = GetGlyphClusterLineBreakClass(p, iFirst, aBreaker);
+ if (baseLbCls == MLineBreaker::ESaLineBreakClass)
+ lbClass = MLineBreaker::ESaLineBreakClass;
+ }
+ if (lbClass == MLineBreaker::EZwLineBreakClass)
+ {
+ iCurrent = p;
+ }
+ }
+ return ETrue;
+ }
+ iClass = lbClass;
+ return ETrue;
+ }
+
+TLineBreakIterator::TLineBreakIterator(TLineBreakClassCache& aBreaker,
+ const TText* aText, TInt aLength, TBool aForwards,
+ TInt aMinBreakPos, TInt aMaxBreakPos)
+ : iBreaker(aBreaker), iText(aText), iTextLength(aLength), iHasSpaces(EFalse)
+ {
+ if (aMinBreakPos < 1)
+ aMinBreakPos = 1;
+ // Find the next valid character and see if it can hang
+ // over the margin.
+ const TText* endText = aText + aLength;
+ const TText* max = aText + aMaxBreakPos;
+ if (endText <= max && aText < endText)
+ {
+ // let 'max' point to last character
+ max = endText - 1;
+ if (IsLowSurrogate(*max))
+ {
+ ASSERT(aLength > 1);
+ --max;
+ ASSERT(IsHighSurrogate(*max));
+ }
+ }
+ TInt c = 0xFFFF;
+ while (max < endText)
+ {
+ TInt lastc = c;
+ c = *max;
+ if ((c & 0xF800) != 0xD800)
+ break;
+ if ((lastc & 0xFC00) == 0xD800
+ && (c & 0xFC00) == 0xDC00)
+ {
+ c = MakeSurrogate(lastc, c);
+ break;
+ }
+ ++max;
+ }
+ if (c != 0xFFFF && max + 1 < endText
+ && aBreaker.Breaker().IsHangingCharacter(c))
+ // Set max to just beyond hanging character
+ ++max;
+ // till here, 'max' points to the "end" of a character
+
+ // set up the iteration.
+ iMinBreakPos = aText + aMinBreakPos;
+ iMaxBreakPos = aText + aMaxBreakPos;
+ // Increment or Decrement must be called to complete set up.
+ if (max < aText + aMinBreakPos)
+ {
+ // no possible line breaks
+ iLimit = 0;
+ iAfterBreak.SetNull();
+ iBeforeBreak.SetNull();
+ }
+ else if (aForwards)
+ {
+ iLimit = max; // point to the 'end' of the last character (low surrogate if supplementary)
+ iLimitAfterSpaces = endText - 1;
+ iAfterBreak.Set(iText, aText + aMinBreakPos - 1, aBreaker);
+ }
+ else
+ {
+ iLimit = aText + aMinBreakPos - 1;
+ iLimitAfterSpaces = iLimit;
+ iBeforeBreak.Set(iText, max - 1, aBreaker);
+ iBeforeBreak.Move(endText - 1, endText - 1, 1, iHasSpaces, aBreaker);
+ }
+ }
+
+TBool TLineBreakIterator::IsBreak(TBool aForwards)
+ {
+ TInt beforeClass = iBeforeBreak.Class();
+ TInt afterClass = iAfterBreak.Class();
+ const MLineBreaker& breaker = iBreaker.Breaker();
+
+ // Line break characters overhang the margin
+ // along with the spaces that precede them.
+ if (afterClass == MLineBreaker::EBkLineBreakClass)
+ {
+ const TText* p = iAfterBreak.Ptr();
+ MoveTextPtr(p, iText + iTextLength, 1);
+ iAfterBreak.Set(iText, p, iBreaker);
+ return ETrue;
+ }
+
+ // Find break within this run of SA text
+ const TText* startOfSaText = iBeforeBreak.Ptr();
+ const TText* endOfSaText = iAfterBreak.Ptr();
+
+ if ((beforeClass != MLineBreaker::ESaLineBreakClass && *startOfSaText != KWhiteSpace) ||
+ (afterClass != MLineBreaker::ESaLineBreakClass))
+ // Complex (South-East Asian) line breaking rules not required.
+ return breaker.LineBreakPossible(beforeClass, afterClass, iHasSpaces);
+
+ MoveTextPtr(endOfSaText, iText + iTextLength, 1);
+ const TText* minBreak = startOfSaText < iMinBreakPos ?
+ iMinBreakPos : startOfSaText + 1;
+ const TText* maxBreak = iMaxBreakPos < endOfSaText ?
+ iMaxBreakPos : endOfSaText - 1;
+ TInt breakPos;
+ TPtrC saText(startOfSaText, endOfSaText - startOfSaText);
+ if (!breaker.GetLineBreakInContext(saText,
+ minBreak - startOfSaText, maxBreak - startOfSaText,
+ aForwards, breakPos))
+ return EFalse;
+
+ // Convert the break position within SA text into iterator positions.
+ const TText* p = startOfSaText + breakPos;
+ iAfterBreak.Set(iText, p, iBreaker);
+ if (*p != KZeroWidthSpace) MoveTextPtr(p, 0, -1);
+ iBeforeBreak.Set(iText, p, iBreaker);
+
+ return ETrue;
+ }
+
+TBool TLineBreakIterator::HasContingentBreak() const
+ {
+ return iBeforeBreak.Class() == MLineBreaker::ECbLineBreakClass
+ || iAfterBreak.Class() == MLineBreaker::ECbLineBreakClass;
+ }
+
+TInt TLineBreakIterator::PreviousClass() const
+ {
+ return iBeforeBreak.Class();
+ }
+
+TInt TLineBreakIterator::NextClass() const
+ {
+ return iAfterBreak.Class();
+ }
+
+TBool TLineBreakIterator::HasSpaces() const
+ {
+ return iHasSpaces;
+ }
+
+TBool TLineBreakIterator::Decrement()
+ {
+ iAfterBreak = iBeforeBreak;
+ return iBeforeBreak.Move(iLimit, iLimitAfterSpaces, -1, iHasSpaces, iBreaker);
+ }
+
+TBool TLineBreakIterator::Increment()
+ {
+ iBeforeBreak = iAfterBreak;
+ return iAfterBreak.Move(iLimit, iLimitAfterSpaces, 1, iHasSpaces, iBreaker);
+ }
+
+TInt TLineBreakIterator::BreakPos() const
+ {
+ const TText* t = iBeforeBreak.Ptr();
+ MoveTextPtr(t, 0, 1);
+ return t - iText;
+ }
+
+TInt TLineBreakIterator::BeforeBreakPos() const
+ {
+ return iBeforeBreak.Ptr() - iText;
+ }
+
+TInt TLineBreakIterator::AfterBreakPos() const
+ {
+ return iAfterBreak.Ptr() - iText;
+ }
+
+TBool HasContingentBreak(TLineBreakIterator& aIterator,
+ MContingentLineBreaker& aCbDelegate)
+ {
+ if (aIterator.PreviousClass() == MLineBreaker::ECbLineBreakClass
+ && aCbDelegate.IsLegalBreakAfter(
+ aIterator.BeforeBreakPos(), aIterator.NextClass(),
+ aIterator.HasSpaces()))
+ return ETrue;
+ if (aIterator.NextClass() == MLineBreaker::ECbLineBreakClass
+ && aCbDelegate.IsLegalBreakBefore(
+ aIterator.AfterBreakPos(), aIterator.PreviousClass(),
+ aIterator.HasSpaces()))
+ return ETrue;
+ return EFalse;
+ }
+
+TBool FindBreak(TLineBreakIterator& aIterator, TBool aForwards,
+ MContingentLineBreaker* aCbDelegate)
+ {
+ while (aForwards? aIterator.Increment() : aIterator.Decrement())
+ {
+ if (aCbDelegate && aIterator.HasContingentBreak())
+ {
+ if (HasContingentBreak(aIterator, *aCbDelegate))
+ {
+ return ETrue;
+ }
+ }
+ else if (aIterator.IsBreak(aForwards))
+ {
+ return ETrue;
+ }
+ }
+ return EFalse;
+ }
+
+TBool HasContingentBreakL(TLineBreakIterator& aIterator,
+ MContingentLineBreakerL& aCbDelegate)
+ {
+ if (aIterator.PreviousClass() == MLineBreaker::ECbLineBreakClass
+ && aCbDelegate.IsLegalBreakAfterL(
+ aIterator.BeforeBreakPos(), aIterator.NextClass(),
+ aIterator.HasSpaces()))
+ return ETrue;
+ if (aIterator.NextClass() == MLineBreaker::ECbLineBreakClass
+ && aCbDelegate.IsLegalBreakBeforeL(
+ aIterator.AfterBreakPos(), aIterator.PreviousClass(),
+ aIterator.HasSpaces()))
+ return ETrue;
+ return EFalse;
+ }
+
+TBool FindBreakL(TLineBreakIterator& aIterator, TBool aForwards,
+ MContingentLineBreakerL* aCbDelegate)
+ {
+ while (aForwards? aIterator.Increment() : aIterator.Decrement())
+ {
+ if (aCbDelegate && aIterator.HasContingentBreak())
+ {
+ if (HasContingentBreakL(aIterator, *aCbDelegate))
+ return ETrue;
+ }
+ else if (aIterator.IsBreak(aForwards))
+ return ETrue;
+ }
+ return EFalse;
+ }
+
+EXPORT_C TBool MLineBreaker::GetLineBreak(const TDesC& aText,
+ TInt aMinBreakPos, TInt aMaxBreakPos, TBool aForwards,
+ MContingentLineBreaker* aCbDelegate,
+ TInt& aBreakPos, TInt& aBreakPosAfterSpaces) const
+/** Finds the line break according to the rules in the virtual functions.
+
+@param aText The text to be broken.
+@param aMinBreakPos The smallest allowed result.
+@param aMaxBreakPos The position of the first character that fails to fit the
+measure.
+@param aForwards ETrue to find the earliest legal break opportunity, EFalse
+to find the last.
+@param aCbDelegate Object to resolve breaks around characters with the CB (cointingent
+break) line breaking class. Typically this class is only used for character
+0xFFFD, which usually marks the position of embedded pictures. May be NULL,
+in which case LineBreakPossible() determines whether these breaks are legal.
+@param aBreakPos Returns the position of the break.
+@param aBreakPosAfterSpaces Returns the position of the start of the next line.
+@return ETrue if successful, EFalse if no legal line breaks were found. */
+ {
+ TLineBreakClassCache cache(*this);
+ const TText* text = aText.Ptr();
+ TLineBreakIterator it(cache, text, aText.Length(),
+ aForwards, aMinBreakPos, aMaxBreakPos);
+ if (!FindBreak(it, aForwards, aCbDelegate))
+ return EFalse;
+ aBreakPos = it.BreakPos();
+ aBreakPosAfterSpaces = it.AfterBreakPos();
+ return ETrue;
+ }
+
+EXPORT_C TBool MLineBreaker::GetLineBreakL(const TDesC& aText,
+ TInt aMinBreakPos, TInt aMaxBreakPos, TBool aForwards,
+ MContingentLineBreakerL* aCbDelegate,
+ TInt& aBreakPos, TInt& aBreakPosAfterSpaces) const
+/** Exactly the same as GetLineBreak, but aCbDelegate's functions may leave so
+the whole function may leave.
+
+@param aText The text to be broken.
+@param aMinBreakPos The smallest allowed result.
+@param aMaxBreakPos he position of the first character that fails to fit the
+measure.
+@param aForwards ETrue to find the earliest legal break opportunity, EFalse
+to find the last.
+@param aCbDelegate Object to resolve breaks around characters with the CB (cointingent
+break) line breaking class. Typically this class is only used for character
+0xFFFD, which usually marks the position of embedded pictures. May be NULL,
+in which case LineBreakPossible() determines whether these breaks are legal.
+@param aBreakPos Returns the position of the break.
+@param aBreakPosAfterSpaces Returns the position of the start of the next line.
+@return ETrue if successful, EFalse if no legal line breaks were found. */
+ {
+ if (aMaxBreakPos < aMinBreakPos)
+ return EFalse;
+ TLineBreakClassCache cache(*this);
+ const TText* text = aText.Ptr();
+ TLineBreakIterator it(cache, text, aText.Length(),
+ aForwards, aMinBreakPos, aMaxBreakPos);
+ if (!FindBreakL(it, aForwards, aCbDelegate))
+ return EFalse;
+ aBreakPos = it.BreakPos();
+ aBreakPosAfterSpaces = it.AfterBreakPos();
+ return ETrue;
+ }
+EXPORT_C void* MLineBreaker::ExtendedInterface(TUid&) const
+/** Returns an interface to more functions, or 0 if these are unsupported.
+Currently there are no other functions, so 0 is always returned. If this
+function is overridden, it must base call if aUid is not recognised,
+rather than just returning 0.
+@param aUid Identifies the interface to be returned.
+@return A pointer to the extended interface, or 0 if not supported. */
+ {
+ return 0;
+ }
+
+