# Tokenize a sample Japanese sentence with Janome and print the base form
# of every token, one per line.
from janome.tokenizer import Tokenizer

# Sample input: a run of repeated kana with no spaces between words, so the
# tokenizer has to find the word boundaries itself.
a = "すもももももももものうち"

# Build the tokenizer once and reuse it for the whole input.
tx = Tokenizer()

# Each token yielded by tokenize() exposes a `base_form` attribute; print
# that rather than the token itself.
for t in tx.tokenize(a):
    print(t.base_form)