|
@@ -25,6 +25,7 @@ following types are supported:
|
|
|
<<irish-analyzer,`irish`>>,
|
|
|
<<italian-analyzer,`italian`>>,
|
|
|
<<latvian-analyzer,`latvian`>>,
|
|
|
+<<lithuanian-analyzer,`lithuanian`>>,
|
|
|
<<norwegian-analyzer,`norwegian`>>,
|
|
|
<<persian-analyzer,`persian`>>,
|
|
|
<<portuguese-analyzer,`portuguese`>>,
|
|
@@ -56,8 +57,9 @@ with the `keywords` set to the value of the `stem_exclusion` parameter.
|
|
|
The following analyzers support setting a custom `stem_exclusion` list:
|
|
|
`arabic`, `armenian`, `basque`, `bulgarian`, `catalan`,
|
|
|
`czech`, `dutch`, `english`, `finnish`, `french`, `galician`,
|
|
|
-`german`, `irish`, `hindi`, `hungarian`, `indonesian`, `italian`, `latvian`, `norwegian`,
|
|
|
-`portuguese`, `romanian`, `russian`, `sorani`, `spanish`, `swedish`, `turkish`.
|
|
|
+`german`, `irish`, `hindi`, `hungarian`, `indonesian`, `italian`, `latvian`,
|
|
|
+`lithuanian`, `norwegian`, `portuguese`, `romanian`, `russian`, `sorani`,
|
|
|
+`spanish`, `swedish`, `turkish`.
|
|
|
|
|
|
==== Reimplementing language analyzers
|
|
|
|
|
@@ -1082,6 +1084,50 @@ The `latvian` analyzer could be reimplemented as a `custom` analyzer as follows:
|
|
|
<2> This filter should be removed unless there are words which should
|
|
|
be excluded from stemming.
|
|
|
|
|
|
+[[lithuanian-analyzer]]
|
|
|
+===== `lithuanian` analyzer
|
|
|
+
|
|
|
+The `lithuanian` analyzer could be reimplemented as a `custom` analyzer as follows:
|
|
|
+
|
|
|
+[source,js]
|
|
|
+----------------------------------------------------
|
|
|
+{
|
|
|
+ "settings": {
|
|
|
+ "analysis": {
|
|
|
+ "filter": {
|
|
|
+ "lithuanian_stop": {
|
|
|
+ "type": "stop",
|
|
|
+ "stopwords": "_lithuanian_" <1>
|
|
|
+ },
|
|
|
+ "lithuanian_keywords": {
|
|
|
+ "type": "keyword_marker",
|
|
|
+ "keywords": [] <2>
|
|
|
+ },
|
|
|
+ "lithuanian_stemmer": {
|
|
|
+ "type": "stemmer",
|
|
|
+ "language": "lithuanian"
|
|
|
+ }
|
|
|
+ },
|
|
|
+ "analyzer": {
|
|
|
+ "lithuanian": {
|
|
|
+ "tokenizer": "standard",
|
|
|
+ "filter": [
|
|
|
+ "lowercase",
|
|
|
+ "lithuanian_stop",
|
|
|
+ "lithuanian_keywords",
|
|
|
+ "lithuanian_stemmer"
|
|
|
+ ]
|
|
|
+ }
|
|
|
+ }
|
|
|
+ }
|
|
|
+ }
|
|
|
+}
|
|
|
+----------------------------------------------------
|
|
|
+<1> The default stopwords can be overridden with the `stopwords`
|
|
|
+ or `stopwords_path` parameters.
|
|
|
+<2> This filter should be removed unless there are words which should
|
|
|
+ be excluded from stemming.
|
|
|
+
|
|
|
[[norwegian-analyzer]]
|
|
|
===== `norwegian` analyzer
|
|
|
|