You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@xerces.apache.org by kn...@apache.org on 2001/10/15 20:30:40 UTC
cvs commit: xml-xerces/c/src/util/regx UnicodeRangeFactory.cpp
knoaman 01/10/15 11:30:40
Modified: c/src/util/regx UnicodeRangeFactory.cpp
Log:
Add support for the Unicode general categories 'Pi' (initial punctuation) and 'Pf' (final punctuation).
Revision Changes Path
1.4 +13 -17 xml-xerces/c/src/util/regx/UnicodeRangeFactory.cpp
Index: UnicodeRangeFactory.cpp
===================================================================
RCS file: /home/cvs/xml-xerces/c/src/util/regx/UnicodeRangeFactory.cpp,v
retrieving revision 1.3
retrieving revision 1.4
diff -u -r1.3 -r1.4
--- UnicodeRangeFactory.cpp 2001/05/11 13:26:51 1.3
+++ UnicodeRangeFactory.cpp 2001/10/15 18:30:40 1.4
@@ -56,6 +56,9 @@
/*
* $Log: UnicodeRangeFactory.cpp,v $
+ * Revision 1.4 2001/10/15 18:30:40 knoaman
+ * Add support for 'Pi' and 'Pf'.
+ *
* Revision 1.3 2001/05/11 13:26:51 tng
* Copyright update.
*
@@ -99,14 +102,14 @@
// ---------------------------------------------------------------------------
// Local data
// ---------------------------------------------------------------------------
-const int UNICATEGSIZE = 35;
-const unsigned short CHAR_LETTER = 28;
-const unsigned short CHAR_MARK = 29;
-const unsigned short CHAR_NUMBER = 30;
-const unsigned short CHAR_SEPARATOR = 31;
-const unsigned short CHAR_OTHER = 32;
-const unsigned short CHAR_PUNCTUATION = 33;
-const unsigned short CHAR_SYMBOL = 34;
+const int UNICATEGSIZE = 37;
+const unsigned short CHAR_LETTER = 30;
+const unsigned short CHAR_MARK = 31;
+const unsigned short CHAR_NUMBER = 32;
+const unsigned short CHAR_SEPARATOR = 33;
+const unsigned short CHAR_OTHER = 34;
+const unsigned short CHAR_PUNCTUATION = 35;
+const unsigned short CHAR_SYMBOL = 36;
const XMLCh uniCategNames[][UNICATEGSIZE] =
{
@@ -138,6 +141,8 @@
{chLatin_S, chLatin_c, chNull},
{chLatin_S, chLatin_k, chNull},
{chLatin_S, chLatin_o, chNull},
+ {chLatin_P, chLatin_i, chNull},
+ {chLatin_P, chLatin_f, chNull},
{chLatin_L, chNull},
{chLatin_M, chNull},
{chLatin_N, chNull},
@@ -181,15 +186,6 @@
for (int j=0; j < 0x10000; j++) {
unsigned short charType = XMLUniCharacter::getType(j);
-
- // Assumption - treat initial punctuation as start punct.
- // - treat final punctuation as end punct.
- if (charType == XMLUniCharacter::INITIAL_PUNCTUATION) {
- charType = XMLUniCharacter::START_PUNCTUATION;
- }
- else if (charType == XMLUniCharacter::FINAL_PUNCTUATION) {
- charType = XMLUniCharacter::END_PUNCTUATION;
- }
ranges[charType]->addRange(j, j);
charType = getUniCategory(charType);
---------------------------------------------------------------------
To unsubscribe, e-mail: xerces-cvs-unsubscribe@xml.apache.org
For additional commands, e-mail: xerces-cvs-help@xml.apache.org