Created
December 19, 2011 04:54
-
-
Save karthikshiraly/1495445 to your computer and use it in GitHub Desktop.
Unit testing Solr 3.x tokenization
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
public static void main(String[] args) { | |
try { | |
StringReader inputText = new StringReader("RUNNING runnable"); | |
Map<String, String> tkargs = new HashMap<String, String>(); | |
tkargs.put("luceneMatchVersion", "LUCENE_33"); | |
TokenizerFactory tkf = new WhitespaceTokenizerFactory(); | |
tkf.init(tkargs); | |
Tokenizer tkz = tkf.create(inputText); | |
LowerCaseFilterFactory lcf = new LowerCaseFilterFactory(); | |
lcf.init(tkargs); | |
TokenStream lcts = lcf.create(tkz); | |
TokenFilterFactory fcf = new SnowballPorterFilterFactory(); | |
Map<String, String> params = new HashMap<String, String>(); | |
params.put("language", "English"); | |
fcf.init(params); | |
TokenStream ts = fcf.create(lcts); | |
CharTermAttribute termAttrib = (CharTermAttribute) ts.getAttribute(CharTermAttribute.class); | |
while (ts.incrementToken()) { | |
String term = termAttrib.toString(); | |
System.out.println(term); | |
} | |
} catch (Exception e) { | |
e.printStackTrace(); | |
} | |
System.exit(0); | |
} |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment