/* gnu/regexp/RETokenPOSIX.java
   Copyright (C) 2006 Free Software Foundation, Inc.

This file is part of GNU Classpath.

GNU Classpath is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 2, or (at your option)
any later version.

GNU Classpath is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
General Public License for more details.

You should have received a copy of the GNU General Public License
along with GNU Classpath; see the file COPYING.  If not, write to the
Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
02110-1301 USA.

Linking this library statically or dynamically with other modules is
making a combined work based on this library.  Thus, the terms and
conditions of the GNU General Public License cover the whole
combination.

As a special exception, the copyright holders of this library give you
permission to link this library with independent modules to produce an
executable, regardless of the license terms of these independent
modules, and to copy and distribute the resulting executable under
terms of your choice, provided that you also meet, for each linked
independent module, the terms and conditions of the license of that
module.  An independent module is a module which is not derived from
or based on this library.  If you modify this library, you may extend
this exception to your version of the library, but you are not
obligated to do so.  If you do not wish to do so, delete this
exception statement from your version. */


package gnu.java.util.regex;

import gnu.java.lang.CPStringBuilder;

final class RETokenPOSIX extends REToken
{
Tom Tromey committed
45 46 47 48
  int type;
  boolean insens;
  boolean negated;

49 50 51 52 53 54 55 56 57 58 59
  static final int ALNUM = 0;
  static final int ALPHA = 1;
  static final int BLANK = 2;
  static final int CNTRL = 3;
  static final int DIGIT = 4;
  static final int GRAPH = 5;
  static final int LOWER = 6;
  static final int PRINT = 7;
  static final int PUNCT = 8;
  static final int SPACE = 9;
  static final int UPPER = 10;
Tom Tromey committed
60 61 62
  static final int XDIGIT = 11;

  // Array indices correspond to constants defined above.
63
  static final String[] s_nameTable = {
Tom Tromey committed
64
    "alnum", "alpha", "blank", "cntrl", "digit", "graph", "lower",
65
    "print", "punct", "space", "upper", "xdigit"
Tom Tromey committed
66 67 68
  };

  // The RE constructor uses this to look up the constant for a string
69 70 71 72
  static int intValue (String key)
  {
    for (int i = 0; i < s_nameTable.length; i++)
      {
73 74
        if (s_nameTable[i].equals (key))
          return i;
75
      }
Tom Tromey committed
76 77 78
    return -1;
  }

79 80 81
  RETokenPOSIX (int subIndex, int type, boolean insens, boolean negated)
  {
    super (subIndex);
Tom Tromey committed
82 83 84 85 86
    this.type = type;
    this.insens = insens;
    this.negated = negated;
  }

87 88 89 90
  int getMinimumLength ()
  {
    return 1;
  }
Tom Tromey committed
91

92 93 94 95
  int getMaximumLength ()
  {
    return 1;
  }
96

97 98 99 100 101 102
  REMatch matchThis (CharIndexed input, REMatch mymatch)
  {
    char ch = input.charAt (mymatch.index);
    boolean retval = matchOneChar (ch);
    if (retval)
      {
103 104
        ++mymatch.index;
        return mymatch;
105
      }
106 107
    return null;
  }
108

109 110
  boolean matchOneChar (char ch)
  {
Tom Tromey committed
111 112
    if (ch == CharIndexed.OUT_OF_BOUNDS)
      return false;
113

Tom Tromey committed
114
    boolean retval = false;
115 116 117
    switch (type)
      {
      case ALNUM:
118 119 120
        // Note that there is some debate over whether '_' should be included
        retval = Character.isLetterOrDigit (ch) || (ch == '_');
        break;
121
      case ALPHA:
122 123
        retval = Character.isLetter (ch);
        break;
124
      case BLANK:
125 126
        retval = ((ch == ' ') || (ch == '\t'));
        break;
127
      case CNTRL:
128 129
        retval = Character.isISOControl (ch);
        break;
130
      case DIGIT:
131 132
        retval = Character.isDigit (ch);
        break;
133
      case GRAPH:
134 135 136
        retval =
          (!(Character.isWhitespace (ch) || Character.isISOControl (ch)));
        break;
137
      case LOWER:
138 139 140
        retval = ((insens && Character.isLetter (ch))
                  || Character.isLowerCase (ch));
        break;
141
      case PRINT:
142 143 144 145
        retval =
          (!(Character.isWhitespace (ch) || Character.isISOControl (ch)))
          || (ch == ' ');
        break;
146
      case PUNCT:
147 148 149
        // This feels sloppy, especially for non-U.S. locales.
        retval = ("`~!@#$%^&*()-_=+[]{}\\|;:'\"/?,.<>".indexOf (ch) != -1);
        break;
150
      case SPACE:
151 152
        retval = Character.isWhitespace (ch);
        break;
153
      case UPPER:
154 155 156
        retval = ((insens && Character.isLetter (ch))
                  || Character.isUpperCase (ch));
        break;
157
      case XDIGIT:
158 159 160
        retval = (Character.isDigit (ch)
                  || ("abcdefABCDEF".indexOf (ch) != -1));
        break;
161
      }
Tom Tromey committed
162

163 164
    if (negated)
      retval = !retval;
165 166 167
    return retval;
  }

168 169 170 171
  boolean returnsFixedLengthMatches ()
  {
    return true;
  }
172

173 174 175 176 177 178
  int findFixedLengthMatches (CharIndexed input, REMatch mymatch, int max)
  {
    int index = mymatch.index;
    int numRepeats = 0;
    while (true)
      {
179 180 181 182 183 184
        if (numRepeats >= max)
          break;
        char ch = input.charAt (index++);
        if (!matchOneChar (ch))
          break;
        numRepeats++;
185
      }
186
    return numRepeats;
Tom Tromey committed
187 188
  }

189 190 191 192 193
  void dump (CPStringBuilder os)
  {
    if (negated)
      os.append ('^');
    os.append ("[:" + s_nameTable[type] + ":]");
Tom Tromey committed
194 195
  }
}