[1]
// Analyzer definition registered under the name "entityAnalyser".
// Attribute order inside an annotation is not significant in Java; the order
// of the entries inside `filters` is kept exactly as originally declared.
@AnalyzerDef(
    name = "entityAnalyser",
    charFilters = {
        @CharFilterDef(factory = HTMLStripCharFilterFactory.class)
    },
    tokenizer = @TokenizerDef(factory = StandardTokenizerFactory.class),
    filters = {
        @TokenFilterDef(factory = StandardFilterFactory.class),
        @TokenFilterDef(factory = LowerCaseFilterFactory.class),
        // NOTE(review): no params are given here, so whatever stop-word list the
        // factory defaults to is used — confirm it suits the French stemmer below.
        @TokenFilterDef(factory = StopFilterFactory.class),
        @TokenFilterDef(
            factory = SnowballPorterFilterFactory.class,
            params = {
                @Parameter(name = "language", value = "French")
            }
        ),
        @TokenFilterDef(
            factory = PhoneticFilterFactory.class,
            params = {
                @Parameter(name = "encoder", value = "DoubleMetaphone")
            }
        ),
        @TokenFilterDef(factory = ASCIIFoldingFilterFactory.class),
        // minGramSize == maxGramSize, so only grams of exactly 3 are requested.
        @TokenFilterDef(
            factory = NGramFilterFactory.class,
            params = {
                @Parameter(name = "minGramSize", value = "3"),
                @Parameter(name = "maxGramSize", value = "3")
            }
        )
    }
)
Doh, this poor string has been beaten to death!