File size: 534 Bytes
d3c86fd |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 |
import nltk
from sumy.parsers.plaintext import PlaintextParser
from sumy.summarizers.luhn import LuhnSummarizer
from sumy.nlp.tokenizers import Tokenizer
# Fetch NLTK's 'punkt' resource as a side effect of importing this module.
# NOTE(review): presumably needed by the Tokenizer("en") used in summarize() -- confirm.
nltk.download('punkt')
def summarize(file, SENTENCES_COUNT):
    """Return an extractive Luhn summary of the text file at ``file.name``.

    Args:
        file: Object exposing a ``name`` attribute that holds the path of the
            text file to summarize; only ``file.name`` is read.
        SENTENCES_COUNT: Sentence count handed to the Luhn summarizer.

    Returns:
        The sentences chosen by the summarizer, converted to ``str`` and
        joined with single spaces (an empty string if none are returned).
    """
    # Decode explicitly as UTF-8 so the result does not depend on the
    # host's locale encoding.
    with open(file.name, encoding="utf-8") as f:
        text = f.read()

    document = PlaintextParser(text, Tokenizer("en")).document
    summarizer = LuhnSummarizer()
    return " ".join(
        str(sentence) for sentence in summarizer(document, SENTENCES_COUNT)
    )