diff options
Diffstat (limited to 'JLanguageTool/src/java/de/danielnaber/languagetool/language/Polish.java')
-rw-r--r-- | JLanguageTool/src/java/de/danielnaber/languagetool/language/Polish.java | 116 |
1 files changed, 116 insertions, 0 deletions
diff --git a/JLanguageTool/src/java/de/danielnaber/languagetool/language/Polish.java b/JLanguageTool/src/java/de/danielnaber/languagetool/language/Polish.java new file mode 100644 index 0000000..13b4faf --- /dev/null +++ b/JLanguageTool/src/java/de/danielnaber/languagetool/language/Polish.java @@ -0,0 +1,116 @@ +/* LanguageTool, a natural language style checker + * Copyright (C) 2007 Daniel Naber (http://www.danielnaber.de) + * + * This library is free software; you can redistribute it and/or + * modify it under the terms of the GNU Lesser General Public + * License as published by the Free Software Foundation; either + * version 2.1 of the License, or (at your option) any later version. + * + * This library is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * Lesser General Public License for more details. + * + * You should have received a copy of the GNU Lesser General Public + * License along with this library; if not, write to the Free Software + * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 + * USA + */ +package de.danielnaber.languagetool.language; + +import java.util.HashSet; +import java.util.Locale; +import java.util.Set; + +import de.danielnaber.languagetool.Language; +import de.danielnaber.languagetool.rules.patterns.Unifier; +import de.danielnaber.languagetool.synthesis.Synthesizer; +import de.danielnaber.languagetool.synthesis.pl.PolishSynthesizer; +import de.danielnaber.languagetool.tagging.Tagger; +import de.danielnaber.languagetool.tagging.disambiguation.Disambiguator; +import de.danielnaber.languagetool.tagging.disambiguation.pl.PolishHybridDisambiguator; +import de.danielnaber.languagetool.tagging.pl.PolishTagger; +import de.danielnaber.languagetool.tokenizers.SentenceTokenizer; +import de.danielnaber.languagetool.tokenizers.SRXSentenceTokenizer; + +public class Polish extends Language { + + private final Tagger tagger = new PolishTagger(); + private final SentenceTokenizer sentenceTokenizer = new SRXSentenceTokenizer("pl"); + private final Disambiguator disambiguator = new PolishHybridDisambiguator(); + private final Synthesizer synthesizer = new PolishSynthesizer(); + private static final Unifier POLISH_UNIFIER = new Unifier(); + private static final Unifier POLISH_DISAMB_UNIFIER = new Unifier(); + + private static final String[] COUNTRIES = {"PL"}; + + @Override + public Locale getLocale() { + return new Locale(getShortName()); + } + + @Override + public String getName() { + return "Polish"; + } + + @Override + public String getShortName() { + return "pl"; + } + + @Override + public String[] getCountryVariants() { + return COUNTRIES; + } + + @Override + public Tagger getTagger() { + return tagger; + } + + @Override + public SentenceTokenizer getSentenceTokenizer() { + return sentenceTokenizer; + } + + @Override + public Disambiguator getDisambiguator() { + return disambiguator; + } + + public Unifier getUnifier() { + return POLISH_UNIFIER; + } + + public Unifier getDisambiguationUnifier() { + return POLISH_DISAMB_UNIFIER; + } + + @Override + public Synthesizer getSynthesizer() { + return synthesizer; + } + + @Override + public Contributor[] getMaintainers() { + return new Contributor[] {new Contributor("Marcin MiĆkowski")}; + } + + @Override + public Set<String> getRelevantRuleIDs() { + final Set<String> ids = new HashSet<String>(); + ids.add("COMMA_PARENTHESIS_WHITESPACE"); + ids.add("DOUBLE_PUNCTUATION"); + ids.add("UPPERCASE_SENTENCE_START"); + ids.add("WORD_REPEAT_RULE"); + ids.add("WHITESPACE_RULE"); + // specific to Polish: + ids.add("PL_UNPAIRED_BRACKETS"); + ids.add("PL_WORD_REPEAT"); + ids.add("PL_COMPOUNDS"); + ids.add("PL_SIMPLE_REPLACE"); + return ids; + } + +} |