|
@@ -375,6 +375,11 @@ public class BpeTokenizerTests extends BaseTokenStreamTestCase {
|
|
|
assertAnalyzesToNoCharFilter(analyzer, "Elasticsearch <<mask>.", new String[] { "Elast", "icsearch", "Ġ", "<", "<mask>", "." });
|
|
|
assertAnalyzesToNoCharFilter(analyzer, "Elasticsearch < red", new String[] { "Elast", "icsearch", "Ġ", "<", "Ġred" });
|
|
|
assertAnalyzesToNoCharFilter(analyzer, "Elasticsearch <mask>.", new String[] { "Elast", "icsearch", "<mask>", "." });
|
|
|
+ assertAnalyzesToNoCharFilter(
|
|
|
+ analyzer,
|
|
|
+ "Elasticsearch<mask><mask>~redElasticsearch",
|
|
|
+ new String[] { "Elast", "icsearch", "<mask>", "<mask>", "~", "red", "Elast", "icsearch" }
|
|
|
+ );
|
|
|
assertAnalyzesToNoCharFilter(
|
|
|
analyzer,
|
|
|
"Elasticsearch red~<mask>.",
|