scuffed-code/icu4c/source/data/translit/Han_Spacedhan.txt
2004-08-02 20:06:55 +00:00

25 lines
799 B
Plaintext

#--------------------------------------------------------------------
# Copyright (c) 1999-2004, International Business Machines
# Corporation and others. All Rights Reserved.
#--------------------------------------------------------------------
# Only intended for internal use
:: fullwidth-halfwidth;
。 > '.';
$terminalPunct = [\.\,\:\;\?\!.,:?!。、;[:Pe:][:Pf:]];
$initialPunct = [:Ps:][:Pi:];
# add space between any Han or terminal punctuation and letters, and
# between letters and Han or initial punct
[[:Ideographic:] $terminalPunct] {} [:Letter:] > ' ' ;
[:Letter:] [:Mark:]* {} [[:Ideographic:] $initialPunct] > ' ' ;
# remove spacing between ideographs and other letters
< [:Ideographic:] { ' ' } [:Letter:] ;
< [:Letter:] [:Mark:]* { ' ' } [:Ideographic:] ;