@@ -247,108 +247,31 @@ public Map<String, AnalysisProvider<TokenizerFactory>> getTokenizers() {
247
247
@ Override
248
248
public List <PreBuiltAnalyzerProviderFactory > getPreBuiltAnalyzerProviderFactories () {
249
249
List <PreBuiltAnalyzerProviderFactory > analyzers = new ArrayList <>();
250
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("standard_html_strip" , CachingStrategy .LUCENE , version -> {
251
- Analyzer a = new StandardHtmlStripAnalyzer (CharArraySet .EMPTY_SET );
252
- a .setVersion (version .luceneVersion );
253
- return a ;
254
- }));
255
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("pattern" , CachingStrategy .ELASTICSEARCH , version -> {
256
- Analyzer a = new PatternAnalyzer (Regex .compile ("\\ W+" /*PatternAnalyzer.NON_WORD_PATTERN*/ , null ), true ,
257
- CharArraySet .EMPTY_SET );
258
- a .setVersion (version .luceneVersion );
259
- return a ;
260
- }));
261
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("snowball" , CachingStrategy .LUCENE , version -> {
262
- Analyzer a = new SnowballAnalyzer ("English" , StopAnalyzer .ENGLISH_STOP_WORDS_SET );
263
- a .setVersion (version .luceneVersion );
264
- return a ;
265
- }));
266
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("arabic" , CachingStrategy .LUCENE , version -> {
267
- Analyzer a = new ArabicAnalyzer ();
268
- a .setVersion (version .luceneVersion );
269
- return a ;
270
- }));
271
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("armenian" , CachingStrategy .LUCENE , version -> {
272
- Analyzer a = new ArmenianAnalyzer ();
273
- a .setVersion (version .luceneVersion );
274
- return a ;
275
- }));
276
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("basque" , CachingStrategy .LUCENE , version -> {
277
- Analyzer a = new BasqueAnalyzer ();
278
- a .setVersion (version .luceneVersion );
279
- return a ;
280
- }));
281
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("bengali" , CachingStrategy .LUCENE , version -> {
282
- Analyzer a = new BengaliAnalyzer ();
283
- a .setVersion (version .luceneVersion );
284
- return a ;
285
- }));
286
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("brazilian" , CachingStrategy .LUCENE , version -> {
287
- Analyzer a = new BrazilianAnalyzer ();
288
- a .setVersion (version .luceneVersion );
289
- return a ;
290
- }));
291
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("bulgarian" , CachingStrategy .LUCENE , version -> {
292
- Analyzer a = new BulgarianAnalyzer ();
293
- a .setVersion (version .luceneVersion );
294
- return a ;
295
- }));
296
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("catalan" , CachingStrategy .LUCENE , version -> {
297
- Analyzer a = new CatalanAnalyzer ();
298
- a .setVersion (version .luceneVersion );
299
- return a ;
300
- }));
301
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("chinese" , CachingStrategy .LUCENE , version -> {
302
- // only for old indices, best effort
303
- Analyzer a = new StandardAnalyzer ();
304
- a .setVersion (version .luceneVersion );
305
- return a ;
306
- }));
307
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("cjk" , CachingStrategy .LUCENE , version -> {
308
- Analyzer a = new CJKAnalyzer ();
309
- a .setVersion (version .luceneVersion );
310
- return a ;
311
- }));
312
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("czech" , CachingStrategy .LUCENE , version -> {
313
- Analyzer a = new CzechAnalyzer ();
314
- a .setVersion (version .luceneVersion );
315
- return a ;
316
- }));
317
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("danish" , CachingStrategy .LUCENE , version -> {
318
- Analyzer a = new DanishAnalyzer ();
319
- a .setVersion (version .luceneVersion );
320
- return a ;
321
- }));
322
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("dutch" , CachingStrategy .LUCENE , version -> {
323
- Analyzer a = new DutchAnalyzer ();
324
- a .setVersion (version .luceneVersion );
325
- return a ;
326
- }));
327
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("english" , CachingStrategy .LUCENE , version -> {
328
- Analyzer a = new EnglishAnalyzer ();
329
- a .setVersion (version .luceneVersion );
330
- return a ;
331
- }));
332
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("finnish" , CachingStrategy .LUCENE , version -> {
333
- Analyzer a = new FinnishAnalyzer ();
334
- a .setVersion (version .luceneVersion );
335
- return a ;
336
- }));
337
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("french" , CachingStrategy .LUCENE , version -> {
338
- Analyzer a = new FrenchAnalyzer ();
339
- a .setVersion (version .luceneVersion );
340
- return a ;
341
- }));
342
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("galician" , CachingStrategy .LUCENE , version -> {
343
- Analyzer a = new GalicianAnalyzer ();
344
- a .setVersion (version .luceneVersion );
345
- return a ;
346
- }));
347
- analyzers .add (new PreBuiltAnalyzerProviderFactory ("german" , CachingStrategy .LUCENE , version -> {
348
- Analyzer a = new GermanAnalyzer ();
349
- a .setVersion (version .luceneVersion );
350
- return a ;
351
- }));
250
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("standard_html_strip" , CachingStrategy .LUCENE ,
251
+ () -> new StandardHtmlStripAnalyzer (CharArraySet .EMPTY_SET )));
252
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("pattern" , CachingStrategy .ELASTICSEARCH ,
253
+ () -> new PatternAnalyzer (Regex .compile ("\\ W+" /*PatternAnalyzer.NON_WORD_PATTERN*/ , null ), true ,
254
+ CharArraySet .EMPTY_SET )));
255
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("snowball" , CachingStrategy .LUCENE ,
256
+ () -> new SnowballAnalyzer ("English" , StopAnalyzer .ENGLISH_STOP_WORDS_SET )));
257
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("arabic" , CachingStrategy .LUCENE , ArabicAnalyzer ::new ));
258
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("armenian" , CachingStrategy .LUCENE , ArmenianAnalyzer ::new ));
259
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("basque" , CachingStrategy .LUCENE , BasqueAnalyzer ::new ));
260
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("bengali" , CachingStrategy .LUCENE , BengaliAnalyzer ::new ));
261
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("brazilian" , CachingStrategy .LUCENE , BrazilianAnalyzer ::new ));
262
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("bulgarian" , CachingStrategy .LUCENE , BulgarianAnalyzer ::new ));
263
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("catalan" , CachingStrategy .LUCENE , CatalanAnalyzer ::new ));
264
+ // chinese analyzer: only for old indices, best effort
265
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("chinese" , CachingStrategy .LUCENE , StandardAnalyzer ::new ));
266
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("cjk" , CachingStrategy .LUCENE , CJKAnalyzer ::new ));
267
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("czech" , CachingStrategy .LUCENE , CzechAnalyzer ::new ));
268
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("danish" , CachingStrategy .LUCENE , DanishAnalyzer ::new ));
269
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("dutch" , CachingStrategy .LUCENE , DutchAnalyzer ::new ));
270
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("english" , CachingStrategy .LUCENE , EnglishAnalyzer ::new ));
271
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("finnish" , CachingStrategy .LUCENE , FinnishAnalyzer ::new ));
272
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("french" , CachingStrategy .LUCENE , FrenchAnalyzer ::new ));
273
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("galician" , CachingStrategy .LUCENE , GalicianAnalyzer ::new ));
274
+ analyzers .add (new PreBuiltAnalyzerProviderFactory ("german" , CachingStrategy .LUCENE , GermanAnalyzer ::new ));
352
275
return analyzers ;
353
276
}
354
277
0 commit comments