You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@xerces.apache.org by kn...@apache.org on 2001/10/15 20:30:40 UTC
cvs commit: xml-xerces/c/src/util/regx UnicodeRangeFactory.cpp

knoaman     01/10/15 11:30:40

  Modified:    c/src/util/regx UnicodeRangeFactory.cpp
  Log:
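  Add support for the Unicode categories 'Pi' (initial punctuation) and 'Pf' (final punctuation), which were previously folded into start and end punctuation.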
  
  Revision  Changes    Path
  1.4       +13 -17    xml-xerces/c/src/util/regx/UnicodeRangeFactory.cpp
  
  Index: UnicodeRangeFactory.cpp
  ===================================================================
  RCS file: /home/cvs/xml-xerces/c/src/util/regx/UnicodeRangeFactory.cpp,v
  retrieving revision 1.3
  retrieving revision 1.4
  diff -u -r1.3 -r1.4
  --- UnicodeRangeFactory.cpp	2001/05/11 13:26:51	1.3
  +++ UnicodeRangeFactory.cpp	2001/10/15 18:30:40	1.4
  @@ -56,6 +56,9 @@
   
   /*
    * $Log: UnicodeRangeFactory.cpp,v $
  + * Revision 1.4  2001/10/15 18:30:40  knoaman
  + * Add support for 'Pi' and 'Pf'.
  + *
    * Revision 1.3  2001/05/11 13:26:51  tng
    * Copyright update.
    *
  @@ -99,14 +102,14 @@
   // ---------------------------------------------------------------------------
   //  Local data
   // ---------------------------------------------------------------------------
  -const int            UNICATEGSIZE     = 35;
  -const unsigned short CHAR_LETTER      = 28;
  -const unsigned short CHAR_MARK        = 29;
  -const unsigned short CHAR_NUMBER      = 30;
  -const unsigned short CHAR_SEPARATOR   = 31;
  -const unsigned short CHAR_OTHER       = 32;
  -const unsigned short CHAR_PUNCTUATION = 33;
  -const unsigned short CHAR_SYMBOL      = 34;
  +const int            UNICATEGSIZE     = 37;
  +const unsigned short CHAR_LETTER      = 30;
  +const unsigned short CHAR_MARK        = 31;
  +const unsigned short CHAR_NUMBER      = 32;
  +const unsigned short CHAR_SEPARATOR   = 33;
  +const unsigned short CHAR_OTHER       = 34;
  +const unsigned short CHAR_PUNCTUATION = 35;
  +const unsigned short CHAR_SYMBOL      = 36;
   
   const XMLCh uniCategNames[][UNICATEGSIZE] =
   {
  @@ -138,6 +141,8 @@
       {chLatin_S, chLatin_c, chNull},
       {chLatin_S, chLatin_k, chNull},
       {chLatin_S, chLatin_o, chNull},
  +    {chLatin_P, chLatin_i, chNull},
  +    {chLatin_P, chLatin_f, chNull},
       {chLatin_L, chNull},
       {chLatin_M, chNull},
       {chLatin_N, chNull},
  @@ -181,15 +186,6 @@
       for (int j=0; j < 0x10000; j++) {
   
           unsigned short charType = XMLUniCharacter::getType(j);
  -
  -		// Assumption - treat initial punctuation as start punct.
  -		//            - treat final punctuation as end punct.
  -		if (charType == XMLUniCharacter::INITIAL_PUNCTUATION) {
  -            charType = XMLUniCharacter::START_PUNCTUATION;
  -        }
  -		else if (charType == XMLUniCharacter::FINAL_PUNCTUATION) {
  -            charType = XMLUniCharacter::END_PUNCTUATION;
  -        }
   
   		ranges[charType]->addRange(j, j);
   		charType = getUniCategory(charType);
  
  
  

---------------------------------------------------------------------
To unsubscribe, e-mail: xerces-cvs-unsubscribe@xml.apache.org
For additional commands, e-mail: xerces-cvs-help@xml.apache.org