# Integration tests for ICU analysis components
#
"Tokenizer":
    - do:
        indices.analyze:
          text:         関西国際空港
          tokenizer:    kuromoji_tokenizer
    - length: { tokens: 4 }
    - match:  { tokens.0.token: 関西 }
    - match:  { tokens.1.token: 関西国際空港 }
    - match:  { tokens.2.token: 国際 }
    - match:  { tokens.3.token: 空港 }
---
"Baseform filter":
    - do:
        indices.analyze:
          text:         飲み
          tokenizer:    kuromoji_tokenizer
          filters:      kuromoji_baseform
    - length: { tokens: 1 }
    - match:  { tokens.0.token: 飲む }
---
"Reading filter":
    - do:
        indices.analyze:
          text:         寿司
          tokenizer:    kuromoji_tokenizer
          filters:      kuromoji_readingform
    - length: { tokens: 1 }
    - match:  { tokens.0.token: sushi }
---
"Stemming filter":
    - do:
        indices.analyze:
          text:         サーバー
          tokenizer:    kuromoji_tokenizer
          filters:      kuromoji_stemmer
    - length: { tokens: 1 }
    - match:  { tokens.0.token: サーバ }