Class LanguageIdentifier

java.lang.Object
org.languagetool.language.identifier.LanguageIdentifier
Direct Known Subclasses:
DefaultLanguageIdentifier, SimpleLanguageIdentifier

public abstract class LanguageIdentifier extends Object
  • Field Details

    • URL_REGEX

      private static final Pattern URL_REGEX
    • MAIL_REGEX

      private static final Pattern MAIL_REGEX
    • SIGNATURE

      private static final Pattern SIGNATURE
    • MENTION

      private static final Pattern MENTION
    • NBSP_INVIS_SEPARATOR

      private static final Pattern NBSP_INVIS_SEPARATOR
    • SCORE_THRESHOLD

      protected static final float SCORE_THRESHOLD
      See Also: Constant Field Values
    • CONSIDER_ONLY_PREFERRED_THRESHOLD

      protected static final int CONSIDER_ONLY_PREFERRED_THRESHOLD
      See Also: Constant Field Values
    • NON_LATIN_CHARS_LANGUAGES

      protected static final List<String> NON_LATIN_CHARS_LANGUAGES
    • REMOVE_EMAIL_SIGNATURE_FILTER

      protected static final com.optimaize.langdetect.text.TextFilter REMOVE_EMAIL_SIGNATURE_FILTER
    • REMOVE_MENTION_FILTER

      protected static final com.optimaize.langdetect.text.TextFilter REMOVE_MENTION_FILTER
    • REMOVE_NON_BREAKING_SPACES_FILTER

      protected static final com.optimaize.langdetect.text.TextFilter REMOVE_NON_BREAKING_SPACES_FILTER
    • REMOVE_URL_FILTER

      protected static final com.optimaize.langdetect.text.TextFilter REMOVE_URL_FILTER
    • UNICODE_BASED_LANG_IDENTIFIER

      protected static final UnicodeBasedDetector UNICODE_BASED_LANG_IDENTIFIER
    • COMMON_WORDS_LANG_IDENTIFIER

      protected static final CommonWordsDetector COMMON_WORDS_LANG_IDENTIFIER
    • maxLength

      protected int maxLength
  • Constructor Details

    • LanguageIdentifier

      public LanguageIdentifier(int maxLength)
  • Method Details