package net.nutch.analysis;

/**
 * Integer token kinds and their printable images for the Nutch analysis
 * tokenizer.
 *
 * <p>The layout (token kind constants, a {@code DEFAULT} state constant and a
 * {@code tokenImage} table) looks like a JavaCC-generated constants file --
 * NOTE(review): confirm against the grammar before editing by hand, since a
 * regenerated file would overwrite manual changes.
 *
 * <p>This type is deliberately kept as an interface so that classes which
 * {@code implements NutchAnalysisConstants} keep compiling. All fields are
 * implicitly {@code public static final}.
 */
public interface NutchAnalysisConstants {

  /** Token kind: end of file. */
  int EOF = 0;
  /** Token kind: {@code <WORD>}. */
  int WORD = 1;
  /** Token kind: {@code <ACRONYM>}. */
  int ACRONYM = 2;
  /** Token kind: {@code <SIGRAM>}. */
  int SIGRAM = 3;
  /** Token kind: {@code <IRREGULAR_WORD>}. */
  int IRREGULAR_WORD = 4;
  /** Token kind: {@code <C_PLUS_PLUS>}. */
  int C_PLUS_PLUS = 5;
  /** Token kind: {@code <C_SHARP>}. */
  int C_SHARP = 6;
  /** Token kind: the literal {@code +}. */
  int PLUS = 7;
  /** Token kind: the literal {@code -}. */
  int MINUS = 8;
  /** Token kind: the literal double quote. */
  int QUOTE = 9;
  /** Token kind: the literal {@code :}. */
  int COLON = 10;
  /** Token kind: the literal {@code /}. */
  int SLASH = 11;
  /** Token kind: the literal {@code .}. */
  int DOT = 12;
  /** Token kind: the literal {@code @}. */
  int ATSIGN = 13;
  /** Token kind: the literal single quote. */
  int APOSTROPHE = 14;
  /** Token kind: {@code <WHITE>}. */
  int WHITE = 15;
  /** Token kind: {@code <WORD_PUNCT>}. */
  int WORD_PUNCT = 16;
  /** Token kind: {@code <LETTER>}. */
  int LETTER = 17;
  /** Token kind: {@code <CJK>}. */
  int CJK = 18;
  /** Token kind: {@code <DIGIT>}. */
  int DIGIT = 19;

  /** Presumably the identifier of the default lexical state -- TODO confirm. */
  int DEFAULT = 0;

  /**
   * Printable image of each token kind; the entry at index {@code k} belongs
   * to the kind constant whose value is {@code k} (for example
   * {@code tokenImage[WORD]} is {@code "<WORD>"}).
   *
   * <p>The array reference is final but its elements are not protected from
   * modification; callers should treat it as read-only.
   */
  String[] tokenImage = {
    "<EOF>",
    "<WORD>",
    "<ACRONYM>",
    "<SIGRAM>",
    "<IRREGULAR_WORD>",
    "<C_PLUS_PLUS>",
    "<C_SHARP>",
    "\"+\"",
    "\"-\"",
    "\"\\\"\"",
    "\":\"",
    "\"/\"",
    "\".\"",
    "\"@\"",
    "\"\\\'\"",
    "<WHITE>",
    "<WORD_PUNCT>",
    "<LETTER>",
    "<CJK>",
    "<DIGIT>",
  };

}