summaryrefslogtreecommitdiffstats
path: root/JLanguageTool/src/java/de/danielnaber/languagetool/rules/AbstractPunctuationCheckRule.java
blob: 89d216bc8ae8acd437bffe9aa5a83042fa652dbf (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
/* LanguageTool, a natural language style checker 
 * Copyright (C) 2005 Daniel Naber (http://www.danielnaber.de)
 * 
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301
 * USA
 */
package de.danielnaber.languagetool.rules;

import java.util.ArrayList;
import java.util.List;
import java.util.ResourceBundle;

import de.danielnaber.languagetool.AnalyzedSentence;
import de.danielnaber.languagetool.AnalyzedTokenReadings;

/**
 * Base class for rules that report suspicious runs of adjacent punctuation
 * tokens. It is meant to catch sequences such as "..", "::" or "-," while
 * leaving combinations such as "...", "!..", "?!!" or ",-" alone.
 * <p>
 * This class only collects consecutive punctuation tokens. Which tokens count
 * as punctuation, and which joined sequences are acceptable, is decided by the
 * language-specific subclass through <code>isPunctuation()</code> and
 * <code>isPunctsJoinOk()</code>.
 * 
 * @author Andriy Rysin
 */
public abstract class AbstractPunctuationCheckRule extends Rule {

  /**
   * Creates the rule and assigns it to the category whose name is stored
   * under the <code>category_misc</code> key of the given bundle.
   * 
   * @param messages resource bundle passed on to the superclass and used to
   *          look up the category name
   */
  public AbstractPunctuationCheckRule(final ResourceBundle messages) {
    super(messages);
    final Category miscCategory = new Category(messages.getString("category_misc"));
    super.setCategory(miscCategory);
  }

  /**
   * @return the fixed identifier of this rule
   */
  public String getId() {
    return "PUNCTUATION_GENERIC_CHECK";
  }

  /**
   * @return a short description of what this rule checks
   */
  public String getDescription() {
    return "Use of unusual combination of punctuation characters";
  }

  /**
   * Decides whether a run of joined punctuation tokens is acceptable.
   * Only called for runs that are at least two characters long.
   * 
   * @param tkns the concatenated text of consecutive punctuation tokens
   * @return <code>true</code> if the combination must not be reported
   */
  protected abstract boolean isPunctsJoinOk(String tkns);

  /**
   * Decides whether a single token belongs to a punctuation run.
   * 
   * @param token the text of one token of the sentence
   * @return <code>true</code> if the token is to be treated as punctuation
   */
  protected abstract boolean isPunctuation(String token);

  /**
   * Scans the sentence for runs of consecutive punctuation tokens and reports
   * every run whose joined text has at least two characters and is rejected
   * by <code>isPunctsJoinOk()</code>.
   * <p>
   * A reported match starts at the start position of the first token of the
   * run and spans the length of the joined text. Its suggested replacement is
   * the first character of the run.
   * 
   * @param text the analyzed sentence to check
   * @return the matches found, converted by <code>toRuleMatchArray()</code>
   */
  public RuleMatch[] match(final AnalyzedSentence text) {
    final AnalyzedTokenReadings[] tokens = text.getTokens();
    final List<RuleMatch> found = new ArrayList<RuleMatch>();

    final int lastIdx = tokens.length - 1;
    final StringBuilder run = new StringBuilder();
    int runStart = -1;

    for (int idx = 0; idx <= lastIdx; idx++) {
      final String current = tokens[idx].getToken();
      final boolean punctuation = isPunctuation(current);

      if (punctuation) {
        if (runStart < 0) {
          runStart = idx;
        }
        run.append(current);
      }

      // A run is closed by the first non-punctuation token, or by reaching
      // the last token of the sentence while still inside the run.
      final boolean runClosed = !punctuation || idx == lastIdx;
      if (runClosed) {
        if (run.length() >= 2) {
          final String joined = run.toString();
          if (!isPunctsJoinOk(joined)) {
            found.add(createRunMatch(tokens[runStart], joined));
          }
        }
        run.setLength(0);
        runStart = -1;
      }
    }

    return toRuleMatchArray(found);
  }

  /**
   * Builds the match for one rejected punctuation run.
   * 
   * @param firstToken the first token of the run; supplies the start position
   * @param joined the concatenated text of the run
   * @return a match covering the run, suggesting its first character
   */
  private RuleMatch createRunMatch(final AnalyzedTokenReadings firstToken,
      final String joined) {
    final String msg = "bad duplication or combination of punctuation signs";
    final int from = firstToken.getStartPos();
    final int to = from + joined.length();
    final RuleMatch result = new RuleMatch(this, from, to, msg,
        "Punctuation problem");
    result.setSuggestedReplacement(joined.substring(0, 1));
    return result;
  }

  /**
   * Does nothing.
   */
  public void reset() {
    // nothing
  }

}