2015-10-08 22:20:33 +00:00
|
|
|
# Copyright (c) 2002-2015, International Business Machines Corporation and
|
2002-12-06 01:40:42 +00:00
|
|
|
# others. All Rights Reserved.
|
2002-06-25 17:23:07 +00:00
|
|
|
#
|
|
|
|
# Title Casing Break Rules
|
|
|
|
#
|
|
|
|
|
2014-03-04 19:58:04 +00:00
|
|
|
|
2002-06-25 17:23:07 +00:00
|
|
|
$CaseIgnorable = [[:Mn:][:Me:][:Cf:][:Lm:][:Sk:] \u0027 \u00AD \u2019];
|
2003-05-20 18:45:43 +00:00
|
|
|
$Cased = [[:Upper_Case:][:Lower_Case:][:Lt:] - $CaseIgnorable];
|
2014-03-04 19:58:04 +00:00
|
|
|
$NotCased = [[^ $Cased] - $CaseIgnorable];
|
2002-06-25 17:23:07 +00:00
|
|
|
|
2014-03-04 19:58:04 +00:00
|
|
|
!!forward;
|
|
|
|
|
|
|
|
# If the iterator begins on a CaseIgnorable, advance it past it/them.
|
|
|
|
# This can occur at the start-of-text, or after application of the
|
|
|
|
# safe-reverse rule.
|
|
|
|
|
|
|
|
($CaseIgnorable | $NotCased)*;
|
|
|
|
|
|
|
|
# Normal exact forward rule: beginning at the start of a word
|
|
|
|
# (at a cased character), advance through the word and through
|
|
|
|
# the uncased characters following the word.
|
|
|
|
|
|
|
|
$Cased ($Cased | $CaseIgnorable)* ($NotCased | $CaseIgnorable)*;
|
2003-05-21 20:07:41 +00:00
|
|
|
|
2002-06-25 17:23:07 +00:00
|
|
|
|
|
|
|
# Reverse Rules
|
2014-03-04 19:58:04 +00:00
|
|
|
!!reverse;
|
2002-06-25 17:23:07 +00:00
|
|
|
|
2014-03-04 19:58:04 +00:00
|
|
|
# Normal Rule, will work nearly universally, so long as there is a
|
|
|
|
# start-of-word preceding the current iteration position.
|
2003-11-05 23:50:39 +00:00
|
|
|
|
2014-03-04 19:58:04 +00:00
|
|
|
($NotCased | $CaseIgnorable)* ($Cased | $CaseIgnorable)* $Cased;
|
|
|
|
|
|
|
|
# Short rule, will be effective only when moving to the start of text,
|
|
|
|
# with no word (cased character) preceding the current iteration position.
|
|
|
|
|
|
|
|
($NotCased | $CaseIgnorable)*;
|
|
|
|
|
|
|
|
!!safe_reverse;
|
|
|
|
|
|
|
|
# Safe Reverse: the exact forward rule must not start in the middle
|
|
|
|
# of a word, so the safe reverse skips over any Cased characters,
|
|
|
|
# leaving it just before the start of a word.
|
|
|
|
|
|
|
|
($Cased | $CaseIgnorable)*;
|
|
|
|
|
|
|
|
!!safe_forward;
|
|
|
|
|
|
|
|
# Safe Forward, nothing needs to be done, the exact Reverse rules will
|
|
|
|
# always find valid boundaries from any starting position.
|
|
|
|
# Still, some rule is needed, so '.', a one character movement.
|
|
|
|
.;
|