OpenCores
URL https://opencores.org/ocsvn/openrisc/openrisc/trunk

Subversion Repositories openrisc

[/] [openrisc/] [trunk/] [gnu-dev/] [or1k-gcc/] [libjava/] [classpath/] [gnu/] [java/] [text/] [SentenceBreakIterator.java] - Blame information for rev 769

Details | Compare with Previous | View Log

Line No. Rev Author Line
1 769 jeremybenn
/* SentenceBreakIterator.java - Default sentence BreakIterator.
2
   Copyright (C) 1999, 2001, 2002, 2004 Free Software Foundation, Inc.
3
 
4
This file is part of GNU Classpath.
5
 
6
GNU Classpath is free software; you can redistribute it and/or modify
7
it under the terms of the GNU General Public License as published by
8
the Free Software Foundation; either version 2, or (at your option)
9
any later version.
10
 
11
GNU Classpath is distributed in the hope that it will be useful, but
12
WITHOUT ANY WARRANTY; without even the implied warranty of
13
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14
General Public License for more details.
15
 
16
You should have received a copy of the GNU General Public License
17
along with GNU Classpath; see the file COPYING.  If not, write to the
18
Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
19
02110-1301 USA.
20
 
21
Linking this library statically or dynamically with other modules is
22
making a combined work based on this library.  Thus, the terms and
23
conditions of the GNU General Public License cover the whole
24
combination.
25
 
26
As a special exception, the copyright holders of this library give you
27
permission to link this library with independent modules to produce an
28
executable, regardless of the license terms of these independent
29
modules, and to copy and distribute the resulting executable under
30
terms of your choice, provided that you also meet, for each linked
31
independent module, the terms and conditions of the license of that
32
module.  An independent module is a module which is not derived from
33
or based on this library.  If you modify this library, you may extend
34
this exception to your version of the library, but you are not
35
obligated to do so.  If you do not wish to do so, delete this
36
exception statement from your version. */
37
 
38
 
39
package gnu.java.text;
40
 
41
import java.text.CharacterIterator;
42
 
43
/**
44
 * @author Tom Tromey <tromey@cygnus.com>
45
 * @date March 23, 1999
46
 * Written using The Unicode Standard, Version 2.0.
47
 */
48
 
49
public class SentenceBreakIterator extends BaseBreakIterator
50
{
51
  public Object clone ()
52
  {
53
    return new SentenceBreakIterator (this);
54
  }
55
 
56
  public SentenceBreakIterator ()
57
  {
58
  }
59
 
60
  private SentenceBreakIterator (SentenceBreakIterator other)
61
  {
62
    iter = (CharacterIterator) other.iter.clone();
63
  }
64
 
65
  public int next ()
66
  {
67
    int end = iter.getEndIndex();
68
    if (iter.getIndex() == end)
69
      return DONE;
70
 
71
    while (iter.getIndex() < end)
72
      {
73
        char c = iter.current();
74
        if (c == CharacterIterator.DONE)
75
          break;
76
        int type = Character.getType(c);
77
 
78
        char n = iter.next();
79
        if (n == CharacterIterator.DONE)
80
          break;
81
 
82
        // Always break after paragraph separator.
83
        if (type == Character.PARAGRAPH_SEPARATOR)
84
          break;
85
 
86
        if (c == '!' || c == '?')
87
          {
88
            // Skip close punctuation.
89
            while (n != CharacterIterator.DONE
90
                   && Character.getType(n) == Character.END_PUNCTUATION)
91
              n = iter.next();
92
            // Skip (java) space, line and paragraph separators.
93
            while (n != CharacterIterator.DONE && Character.isWhitespace(n))
94
              n = iter.next();
95
 
96
            // There's always a break somewhere after `!' or `?'.
97
            break;
98
          }
99
 
100
        if (c == '.')
101
          {
102
            int save = iter.getIndex();
103
            // Skip close punctuation.
104
            while (n != CharacterIterator.DONE
105
                   && Character.getType(n) == Character.END_PUNCTUATION)
106
              n = iter.next();
107
            // Skip (java) space, line and paragraph separators.
108
            // We keep count because we need at least one for this period to
109
            // represent a terminator.
110
            int spcount = 0;
111
            while (n != CharacterIterator.DONE && Character.isWhitespace(n))
112
              {
113
                n = iter.next();
114
                ++spcount;
115
              }
116
            if (spcount > 0)
117
              {
118
                int save2 = iter.getIndex();
119
                // Skip over open puncutation.
120
                while (n != CharacterIterator.DONE
121
                       && Character.getType(n) == Character.START_PUNCTUATION)
122
                  n = iter.next();
123
                // Next character must not be lower case.
124
                if (n == CharacterIterator.DONE
125
                    || ! Character.isLowerCase(n))
126
                  {
127
                    iter.setIndex(save2);
128
                    break;
129
                  }
130
              }
131
            iter.setIndex(save);
132
          }
133
      }
134
 
135
    return iter.getIndex();
136
  }
137
 
138
  private final int previous_internal ()
139
  {
140
    int start = iter.getBeginIndex();
141
    if (iter.getIndex() == start)
142
      return DONE;
143
 
144
    while (iter.getIndex() >= start)
145
      {
146
        char c = iter.previous();
147
        if (c == CharacterIterator.DONE)
148
          break;
149
 
150
        char n = iter.previous();
151
        if (n == CharacterIterator.DONE)
152
          break;
153
        iter.next();
154
        int nt = Character.getType(n);
155
 
156
        if (! Character.isLowerCase(c)
157
            && (nt == Character.START_PUNCTUATION
158
                || Character.isWhitespace(n)))
159
          {
160
            int save = iter.getIndex();
161
            int save_nt = nt;
162
            char save_n = n;
163
            // Skip open punctuation.
164
            while (n != CharacterIterator.DONE
165
                   && Character.getType(n) == Character.START_PUNCTUATION)
166
              n = iter.previous();
167
            if (n == CharacterIterator.DONE)
168
              break;
169
            if (Character.isWhitespace(n))
170
              {
171
                // Must have at least one (java) space after the `.'.
172
                int save2 = iter.getIndex();
173
                while (n != CharacterIterator.DONE
174
                       && Character.isWhitespace(n))
175
                  n = iter.previous();
176
                // Skip close punctuation.
177
                while (n != CharacterIterator.DONE
178
                       && Character.getType(n) == Character.END_PUNCTUATION)
179
                  n = iter.previous();
180
                if (n == CharacterIterator.DONE || n == '.')
181
                  {
182
                    // Communicate location of actual end.
183
                    period = iter.getIndex();
184
                    iter.setIndex(save2);
185
                    break;
186
                  }
187
              }
188
            iter.setIndex(save);
189
            nt = save_nt;
190
            n = save_n;
191
          }
192
 
193
        if (nt == Character.PARAGRAPH_SEPARATOR)
194
          {
195
            // Communicate location of actual end.
196
            period = iter.getIndex();
197
            break;
198
          }
199
        else if (Character.isWhitespace(n)
200
                 || nt == Character.END_PUNCTUATION)
201
          {
202
            int save = iter.getIndex();
203
            // Skip (java) space, line and paragraph separators.
204
            while (n != CharacterIterator.DONE
205
                   && Character.isWhitespace(n))
206
              n = iter.previous();
207
            // Skip close punctuation.
208
            while (n != CharacterIterator.DONE
209
                   && Character.getType(n) == Character.END_PUNCTUATION)
210
              n = iter.previous();
211
            int here = iter.getIndex();
212
            iter.setIndex(save);
213
            if (n == CharacterIterator.DONE || n == '!' || n == '?')
214
              {
215
                // Communicate location of actual end.
216
                period = here;
217
                break;
218
              }
219
          }
220
        else if (n == '!' || n == '?')
221
          {
222
            // Communicate location of actual end.
223
            period = iter.getIndex();
224
            break;
225
          }
226
      }
227
 
228
    return iter.getIndex();
229
  }
230
 
231
  public int previous ()
232
  {
233
    // We want to skip over the first sentence end to the second one.
234
    // However, at the end of the string we want the first end.
235
    int here = iter.getIndex();
236
    period = here;
237
    int first = previous_internal ();
238
    if (here == iter.getEndIndex() || first == DONE)
239
      return first;
240
    iter.setIndex(period);
241
    return previous_internal ();
242
  }
243
 
244
  // This is used for communication between previous and
245
  // previous_internal.
246
  private int period;
247
}

powered by: WebSVN 2.1.0

© copyright 1999-2024 OpenCores.org, equivalent to Oliscience, all rights reserved. OpenCores®, registered trademark.