# Tokenize a sample text, drop symbol-only tokens, and stem the remaining words
# with NLTK's Snowball stemmer.
import nltk
from nltk.stem.snowball import SnowballStemmer

stemmer = SnowballStemmer("russian")

# NOTE(review): word_tokenize is called with its default language while the
# stemmer is configured for Russian -- confirm this pairing is intended.
tokens = nltk.word_tokenize('''Some text with words''')

# Keep only tokens that contain at least one letter or digit, so tokens made
# up purely of punctuation/symbols are not passed to the stemmer.
words = [token for token in tokens if any(ch.isalnum() for ch in token)]

# Build the list eagerly and keep it: a bare ``map(...)`` call is lazy on
# Python 3 and its result was discarded, so no stemming actually happened.
stems = [stemmer.stem(word) for word in words]