001 /* 002 NGramJ - n-gram based text classification 003 Copyright (C) 2001 Frank S. Nestel (frank at spieleck.de) 004 005 This program is free software; you can redistribute it and/or modify 006 it under the terms of the GNU Lesser General Public License as published 007 by the Free Software Foundation; either version 2.1 of the License, or 008 (at your option) any later version. 009 010 This program is distributed in the hope that it will be useful, 011 but WITHOUT ANY WARRANTY; without even the implied warranty of 012 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 013 GNU General Public License for more details. 014 015 You should have received a copy of the GNU Lesser General Public License 016 along with this program (lesser.txt); if not, write to the Free Software 017 Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 018 */ 019 020 package de.spieleck.app.ngramj.lm; 021 022 /** 023 * Fairly abstract interface to model an ranking of NGrams. 024 */ 025 public interface LMConstants 026 { 027 /** 028 * Theses bytes seem to be considered skipable by text_cat in PERL. 029 */ 030 public static final byte[] SKIPABLE = new byte[] 031 {32,48,49,50,51,52,53,54,55,56,57,10,13}; 032 033 /** 034 * Effectively used NGrams from a text. 035 */ 036 public final static int USEDNGRAMS = 400; 037 } 038