Commit 6fdc318a by Sartika Aritonang

Upload New File

parent 74e357cf
#from Sastrawi.Stemmer.StemmerInterface import StemmerInterface
from Sastrawi.Stemmer.Filter import TextNormalizer
class CachedStemmer(object):
    """Stemmer wrapper that reuses previously computed stems from a cache.

    Each word of the input is looked up in ``cache`` first; only words that
    are not cached yet are handed to ``delegatedStemmer``, and the result is
    stored so later lookups of the same word skip the delegate.

    The cache object must provide ``has(key)``, ``get(key)`` and
    ``set(key, value)``; the delegate must provide ``stem(word)``.
    """

    def __init__(self, cache, delegatedStemmer):
        """Store the cache and the stemmer used for cache misses.

        Args:
            cache: Object exposing ``has``, ``get`` and ``set``.
            delegatedStemmer: Object exposing ``stem(word)``.
        """
        self.cache = cache
        self.delegatedStemmer = delegatedStemmer

    def stem(self, text):
        """Return ``text`` with every word replaced by its stem.

        The text is first passed through ``TextNormalizer.normalize_text``
        and then split on single spaces. Each word is resolved from the
        cache when present, otherwise it is stemmed by the delegate and the
        result is cached.

        Args:
            text: The text to stem.

        Returns:
            The stems joined by single spaces, in input order.
        """
        normalized = TextNormalizer.normalize_text(text)

        stems = []
        # split(' ') (not split()) keeps one token per single space, so an
        # empty normalized string still yields one empty-string word that is
        # processed like any other word.
        for word in normalized.split(' '):
            if self.cache.has(word):
                stems.append(self.cache.get(word))
            else:
                stem = self.delegatedStemmer.stem(word)
                # Remember the result so the delegate is not called again
                # for this word.
                self.cache.set(word, stem)
                stems.append(stem)

        return ' '.join(stems)

    def get_cache(self):
        """Return the cache object given to the constructor."""
        return self.cache
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment